annotate src/coding.c @ 112288:81d8294d0c45

* coding.c (decode_coding_emacs_mule): Remove unreachable code. This is a typo left over from revno 95090 dated 2009-03-06, which fixed Bug#2370. Caught by Sun cc.
author Paul Eggert <eggert@cs.ucla.edu>
date Sun, 16 Jan 2011 18:55:28 -0800
parents ef719132ddfa
children 42e22c4f06b7
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
88936
c6ed294ee664 Comment fix
Dave Love <fx@gnu.org>
parents: 88889
diff changeset
1 /* Coding system handler (conversion, detection, etc).
68651
3bd95f4f2941 Update years in copyright notice; nfc.
Thien-Thi Nguyen <ttn@gnuvola.org>
parents: 68567
diff changeset
2 Copyright (C) 2001, 2002, 2003, 2004, 2005,
112218
376148b31b5e Add 2011 to FSF/AIST copyright years.
Glenn Morris <rgm@gnu.org>
parents: 111743
diff changeset
3 2006, 2007, 2008, 2009, 2010, 2011 Free Software Foundation, Inc.
74605
6ee41fdd69ff Update AIST copyright years.
Kenichi Handa <handa@m17n.org>
parents: 73995
diff changeset
4 Copyright (C) 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
112218
376148b31b5e Add 2011 to FSF/AIST copyright years.
Glenn Morris <rgm@gnu.org>
parents: 111743
diff changeset
5 2005, 2006, 2007, 2008, 2009, 2010, 2011
67658
547f2b420666 Copyright fixed
Kenichi Handa <handa@m17n.org>
parents: 67555
diff changeset
6 National Institute of Advanced Industrial Science and Technology (AIST)
547f2b420666 Copyright fixed
Kenichi Handa <handa@m17n.org>
parents: 67555
diff changeset
7 Registration Number H14PRO021
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8 Copyright (C) 2003
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9 National Institute of Advanced Industrial Science and Technology (AIST)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10 Registration Number H13PRO009
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
11
17071
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
12 This file is part of GNU Emacs.
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
13
94963
8971ddf55736 Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents: 94944
diff changeset
14 GNU Emacs is free software: you can redistribute it and/or modify
17071
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
15 it under the terms of the GNU General Public License as published by
94963
8971ddf55736 Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents: 94944
diff changeset
16 the Free Software Foundation, either version 3 of the License, or
8971ddf55736 Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents: 94944
diff changeset
17 (at your option) any later version.
17071
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
18
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
19 GNU Emacs is distributed in the hope that it will be useful,
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
20 but WITHOUT ANY WARRANTY; without even the implied warranty of
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
21 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
22 GNU General Public License for more details.
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
23
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
24 You should have received a copy of the GNU General Public License
94963
8971ddf55736 Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents: 94944
diff changeset
25 along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
26
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
27 /*** TABLE OF CONTENTS ***
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
28
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
29 0. General comments
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
30 1. Preamble
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
31 2. Emacs' internal format (emacs-utf-8) handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
32 3. UTF-8 handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
33 4. UTF-16 handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
34 5. Charset-base coding systems handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
35 6. emacs-mule (old Emacs' internal format) handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
36 7. ISO2022 handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
37 8. Shift-JIS and BIG5 handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
38 9. CCL handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
39 10. C library functions
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
40 11. Emacs Lisp library functions
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
41 12. Postamble
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
42
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
43 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
44
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
45 /*** 0. General comments ***
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
46
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
47
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
48 CODING SYSTEM
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
49
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
50 A coding system is an object for an encoding mechanism that contains
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
51 information about how to convert byte sequences to character
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
52 sequences and vice versa. When we say "decode", it means converting
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
53 a byte sequence of a specific coding system into a character
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
54 sequence that is represented by Emacs' internal coding system
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
55 `emacs-utf-8', and when we say "encode", it means converting a
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
56 character sequence of emacs-utf-8 to a byte sequence of a specific
17835
f36ffb6f1208 Name change through the code:
Kenichi Handa <handa@m17n.org>
parents: 17725
diff changeset
57 coding system.
f36ffb6f1208 Name change through the code:
Kenichi Handa <handa@m17n.org>
parents: 17725
diff changeset
58
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
59 In Emacs Lisp, a coding system is represented by a Lisp symbol. At
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
60 the C level, a coding system is represented by a vector of attributes
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
61 stored in the hash table Vcoding_system_hash_table. The conversion from
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
62 coding system symbol to attributes vector is done by looking up
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
63 Vcoding_system_hash_table by the symbol.
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
64
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
65 Coding systems are classified into the following types depending on
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
66 the encoding mechanism. Here's a brief description of the types.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
67
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
68 o UTF-8
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
69
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
70 o UTF-16
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
71
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
72 o Charset-base coding system
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
73
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
74 A coding system defined by one or more (coded) character sets.
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
75 Decoding and encoding are done by a code converter defined for each
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
76 character set.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
77
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
78 o Old Emacs internal format (emacs-mule)
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
79
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
80 The coding system adopted by old versions of Emacs (20 and 21).
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
81
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
82 o ISO2022-base coding system
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
83
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
84 The most famous coding system for multiple character sets. X's
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
85 Compound Text, various EUCs (Extended Unix Code), and coding systems
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
86 used in Internet communication such as ISO-2022-JP are all
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
87 variants of ISO2022.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
88
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
89 o SJIS (or Shift-JIS or MS-Kanji-Code)
42104
d69c2368e549 (DECODE_COMPOSITION_END): Fixed a typo in the last
Sam Steingold <sds@gnu.org>
parents: 42103
diff changeset
90
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
91 A coding system to encode character sets: ASCII, JISX0201, and
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
92 JISX0208. Widely used for PC's in Japan. Details are described in
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
93 section 8.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
94
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
95 o BIG5
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
96
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
97 A coding system to encode character sets: ASCII and Big5. Widely
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
98 used for Chinese (mainly in Taiwan and Hong Kong). Details are
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
99 described in section 8. In this file, when we write "big5" (all
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
100 lowercase), we mean the coding system, and when we write "Big5"
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
101 (capitalized), we mean the character set.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
102
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
103 o CCL
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
104
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
105 If a user wants to decode/encode text encoded in a coding system
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
106 not listed above, they can supply a decoder and an encoder for it in
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
107 CCL (Code Conversion Language) programs. Emacs executes the CCL
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
108 program while decoding/encoding.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
109
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
110 o Raw-text
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
111
88771
75c78754826d comments
Dave Love <fx@gnu.org>
parents: 88690
diff changeset
112 A coding system for text containing raw eight-bit data. Emacs
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
113 treats each byte of source text as a character (except for
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
114 end-of-line conversion).
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
115
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
116 o No-conversion
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
117
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
118 Like raw text, but don't do end-of-line conversion.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
119
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
120
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
121 END-OF-LINE FORMAT
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
122
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
123 How text end-of-line is encoded depends on the operating system. For
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
124 instance, Unix's format is just one byte of LF (line-feed) code,
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
125 whereas DOS's format is a two-byte sequence of `carriage-return' and
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
126 `line-feed' codes. MacOS's format is usually one byte of
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
127 `carriage-return'.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
128
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
129 Since text character encoding and end-of-line encoding are
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
130 independent, any coding system described above can take any format
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
131 of end-of-line (except for no-conversion).
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
132
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
133 STRUCT CODING_SYSTEM
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
134
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
135 Before using a coding system for code conversion (i.e. decoding and
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
136 encoding), we set up a structure of type `struct coding_system'.
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
137 This structure keeps various information about a specific code
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
138 conversion (e.g. the location of source and destination data).
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
139
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
140 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
141
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
142 /* COMMON MACROS */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
143
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
144
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
145 /*** GENERAL NOTES on `detect_coding_XXX ()' functions ***
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
146
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
147 These functions check if a byte sequence specified as a source in
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
148 CODING conforms to the format of XXX, and update the members of
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
149 DETECT_INFO.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
150
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
151 Return 1 if the byte sequence conforms to XXX, otherwise return 0.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
152
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
153 Below is the template of these functions. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
154
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
155 #if 0
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
156 static int
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
157 detect_coding_XXX (struct coding_system *coding,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
158 struct coding_detection_info *detect_info)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
159 {
90070
95879cc1ed20 Revision: miles@gnu.org--gnu-2004/emacs--unicode--0--patch-81
Miles Bader <miles@gnu.org>
parents: 90061 59173
diff changeset
160 const unsigned char *src = coding->source;
95879cc1ed20 Revision: miles@gnu.org--gnu-2004/emacs--unicode--0--patch-81
Miles Bader <miles@gnu.org>
parents: 90061 59173
diff changeset
161 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
162 int multibytep = coding->src_multibyte;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
163 int consumed_chars = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
164 int found = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
165 ...;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
166
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
167 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
168 {
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
169 /* Get one byte from the source. If the source is exhausted, jump
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
170 to no_more_source:. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
171 ONE_MORE_BYTE (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
172
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
173 if (! __C_conforms_to_XXX___ (c))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
174 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
175 if (__C_strongly_suggests_XXX__ (c))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
176 found = CATEGORY_MASK_XXX;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
177 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
178 /* The byte sequence is invalid for XXX. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
179 detect_info->rejected |= CATEGORY_MASK_XXX;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
180 return 0;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
181
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
182 no_more_source:
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
183 /* The source was exhausted successfully. */
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
184 detect_info->found |= found;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
185 return 1;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
186 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
187 #endif
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
188
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
189 /*** GENERAL NOTES on `decode_coding_XXX ()' functions ***
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
190
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
191 These functions decode a byte sequence specified as a source by
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
192 CODING. The resulting multibyte text goes to a place pointed to by
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
193 CODING->charbuf, the length of which should not exceed
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
194 CODING->charbuf_size.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
195
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
196 These functions set the information of original and decoded texts in
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
197 CODING->consumed, CODING->consumed_char, and CODING->charbuf_used.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
198 They also set CODING->result to one of CODING_RESULT_XXX indicating
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
199 how the decoding is finished.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
200
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
201 Below is the template of these functions. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
202
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
203 #if 0
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
204 static void
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
205 decode_coding_XXXX (struct coding_system *coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
206 {
90070
95879cc1ed20 Revision: miles@gnu.org--gnu-2004/emacs--unicode--0--patch-81
Miles Bader <miles@gnu.org>
parents: 90061 59173
diff changeset
207 const unsigned char *src = coding->source + coding->consumed;
95879cc1ed20 Revision: miles@gnu.org--gnu-2004/emacs--unicode--0--patch-81
Miles Bader <miles@gnu.org>
parents: 90061 59173
diff changeset
208 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
209 /* SRC_BASE remembers the start position in source in each loop.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
210 The loop will be exited when there's not enough source code, or
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
211 when there's no room in CHARBUF for a decoded character. */
90070
95879cc1ed20 Revision: miles@gnu.org--gnu-2004/emacs--unicode--0--patch-81
Miles Bader <miles@gnu.org>
parents: 90061 59173
diff changeset
212 const unsigned char *src_base;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
213 /* A buffer to produce decoded characters. */
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
214 int *charbuf = coding->charbuf + coding->charbuf_used;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
215 int *charbuf_end = coding->charbuf + coding->charbuf_size;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
216 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
217
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
218 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
219 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
220 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
221 if (charbuf >= charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
222 /* No more room to produce a decoded character. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
223 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
224 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
225 /* Decode it. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
226 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
227
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
228 no_more_source:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
229 if (src_base < src_end
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
230 && coding->mode & CODING_MODE_LAST_BLOCK)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
231 /* If the source ends with a partial byte sequence of a character,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
232 treat them as eight-bit raw data. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
233 while (src_base < src_end && charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
234 *charbuf++ = *src_base++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
235 /* Remember how many bytes and characters we consumed. If the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
236 source is multibyte, the bytes and chars are not identical. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
237 coding->consumed = coding->consumed_char = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
238 /* Remember how many characters we produced. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
239 coding->charbuf_used = charbuf - coding->charbuf;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
240 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
241 #endif
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
242
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
243 /*** GENERAL NOTES on `encode_coding_XXX ()' functions ***
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
244
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
245 These functions encode SRC_BYTES length text at SOURCE of Emacs'
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
246 internal multibyte format by CODING. The resulting byte sequence
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
247 goes to a place pointed to by DESTINATION, the length of which
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
248 should not exceed DST_BYTES.
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
249
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
250 These functions set the information of original and encoded texts in
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
251 the members produced, produced_char, consumed, and consumed_char of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
252 the structure *CODING. They also set the member result to one of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
253 CODING_RESULT_XXX indicating how the encoding finished.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
254
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
255 DST_BYTES zero means that source area and destination area are
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
256 overlapped, which means that we can produce an encoded text until it
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
257 reaches the head of not-yet-encoded source text.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
258
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
259 Below is a template of these functions. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
260 #if 0
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
261 static void
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
262 encode_coding_XXX (struct coding_system *coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
263 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
264 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
265 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
266 int *charbuf_end = coding->charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
267 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
268 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
269 unsigned char *adjusted_dst_end = dst_end - _MAX_BYTES_PRODUCED_IN_LOOP_;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
270 int produced_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
271
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
272 for (; charbuf < charbuf_end && dst < adjusted_dst_end; charbuf++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
273 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
274 int c = *charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
275 /* Encode C into DST, and increment DST. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
276 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
277 label_no_more_destination:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
278 /* How many chars and bytes we produced. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
279 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
280 coding->produced = dst - coding->destination;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
281 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
282 #endif
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
283
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
284
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
285 /*** 1. Preamble ***/
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
286
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
287 #include <config.h>
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
288 #include <stdio.h>
105669
68dd71358159 * alloc.c: Do not define struct catchtag.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105179
diff changeset
289 #include <setjmp.h>
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
290
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
291 #include "lisp.h"
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
292 #include "buffer.h"
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
293 #include "character.h"
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
294 #include "charset.h"
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
295 #include "ccl.h"
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
296 #include "composite.h"
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
297 #include "coding.h"
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
298 #include "window.h"
83127
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
299 #include "frame.h"
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
300 #include "termhooks.h"
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
301
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
302 Lisp_Object Vcoding_system_hash_table;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
303
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
304 Lisp_Object Qcoding_system, Qcoding_aliases, Qeol_type;
88646
d3b1f30e2267 (Qmac): Remove (duplicated) definition.
Dave Love <fx@gnu.org>
parents: 88645
diff changeset
305 Lisp_Object Qunix, Qdos;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
306 Lisp_Object Qbuffer_file_coding_system;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
307 Lisp_Object Qpost_read_conversion, Qpre_write_conversion;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
308 Lisp_Object Qdefault_char;
19612
783efd6c7c1e (Qno_conversion, Qundecided): New variables.
Kenichi Handa <handa@m17n.org>
parents: 19546
diff changeset
309 Lisp_Object Qno_conversion, Qundecided;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
310 Lisp_Object Qcharset, Qiso_2022, Qutf_8, Qutf_16, Qshift_jis, Qbig5;
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
311 Lisp_Object Qbig, Qlittle;
19750
95e4e1cba6ac (Qcoding_system_history): New variable.
Richard M. Stallman <rms@gnu.org>
parents: 19747
diff changeset
312 Lisp_Object Qcoding_system_history;
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
313 Lisp_Object Qvalid_codes;
100303
3e044fa54e4f * coding.c (QCdefault_char): Rename from QCdefalut_char.
Juanma Barranquero <lekktu@gmail.com>
parents: 100262
diff changeset
314 Lisp_Object QCcategory, QCmnemonic, QCdefault_char;
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
315 Lisp_Object QCdecode_translation_table, QCencode_translation_table;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
316 Lisp_Object QCpost_read_conversion, QCpre_write_conversion;
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
317 Lisp_Object QCascii_compatible_p;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
318
64251
3de1b955c31a * coding.c (Qprocess_argument):
Kim F. Storm <storm@cua.dk>
parents: 64084
diff changeset
319 Lisp_Object Qcall_process, Qcall_process_region;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
320 Lisp_Object Qstart_process, Qopen_network_stream;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
321 Lisp_Object Qtarget_idx;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
322
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
323 Lisp_Object Qinsufficient_source, Qinconsistent_eol, Qinvalid_source;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
324 Lisp_Object Qinterrupted, Qinsufficient_memory;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
325
52794
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
326 /* If a symbol has this property, evaluate the value to define the
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
327 symbol as a coding system. */
90272
f1df126ec7de Sync to HEAD for handling autoload-coding-system.
Kenichi Handa <handa@m17n.org>
parents: 90263
diff changeset
328 static Lisp_Object Qcoding_system_define_form;
f1df126ec7de Sync to HEAD for handling autoload-coding-system.
Kenichi Handa <handa@m17n.org>
parents: 90263
diff changeset
329
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
330 int coding_system_require_warning;
52794
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
331
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
332 Lisp_Object Vselect_safe_coding_system_function;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
333
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
334 /* Mnemonic string for each format of end-of-line. */
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
335 Lisp_Object eol_mnemonic_unix, eol_mnemonic_dos, eol_mnemonic_mac;
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
336 /* Mnemonic string to indicate format of end-of-line is not yet
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
337 decided. */
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
338 Lisp_Object eol_mnemonic_undecided;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
339
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
340 /* Format of end-of-line decided by system. This is Qunix on
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
341 Unix and Mac, Qdos on DOS/Windows.
70520
b6740a317343 (setup_coding_system): For invalid coding-system, set
Kenichi Handa <handa@m17n.org>
parents: 69995
diff changeset
342 This has an effect only for external encoding (i.e. for output to
b6740a317343 (setup_coding_system): For invalid coding-system, set
Kenichi Handa <handa@m17n.org>
parents: 69995
diff changeset
343 file and process), not for in-buffer or Lisp string encoding. */
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
344 static Lisp_Object system_eol_type;
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
345
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
346 #ifdef emacs
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
347
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
348 Lisp_Object Vcoding_system_list, Vcoding_system_alist;
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
349
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
350 Lisp_Object Qcoding_system_p, Qcoding_system_error;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
351
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
352 /* Coding systems emacs-mule and raw-text are for converting only
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
353 end-of-line format. */
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
354 Lisp_Object Qemacs_mule, Qraw_text;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
355 Lisp_Object Qutf_8_emacs;
51406
3c675181c3d8 (Qutf_8): New.
Dave Love <fx@gnu.org>
parents: 51356
diff changeset
356
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
357 /* Coding-systems are handed between Emacs Lisp programs and C internal
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
358 routines by the following three variables. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
359 /* Coding-system for reading files and receiving data from process. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
360 Lisp_Object Vcoding_system_for_read;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
361 /* Coding-system for writing files and sending data to process. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
362 Lisp_Object Vcoding_system_for_write;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
363 /* Coding-system actually used in the latest I/O. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
364 Lisp_Object Vlast_coding_system_used;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
365 /* Set to non-nil when an error is detected during code conversion. */
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
366 Lisp_Object Vlast_code_conversion_error;
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
367 /* A vector of length 256 which contains information about special
22529
d9eac134a41b Doc fixes.
Karl Heuer <kwzh@gnu.org>
parents: 22502
diff changeset
368 Latin codes (especially for dealing with Microsoft codes). */
19365
d9374f5ebd3a (CODING_FLAG_ISO_LATIN_EXTRA): New macro.
Kenichi Handa <handa@m17n.org>
parents: 19285
diff changeset
369 Lisp_Object Vlatin_extra_code_table;
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
370
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
371 /* Flag to inhibit code conversion of end-of-line format. */
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
372 int inhibit_eol_conversion;
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
373
30204
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
374 /* Flag to inhibit ISO2022 escape sequence detection. */
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
375 int inhibit_iso_escape_detection;
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
376
101040
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
377 /* Flag to inhibit detection of binary files through null bytes. */
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
378 int inhibit_null_byte_detection;
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
379
21574
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
380 /* Flag to make buffer-file-coding-system inherit from process-coding. */
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
381 int inherit_process_coding_system;
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
382
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
383 /* Coding system to be used to encode text for terminal display when
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
384 terminal coding system is nil. */
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
385 struct coding_system safe_terminal_coding;
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
386
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
387 Lisp_Object Vfile_coding_system_alist;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
388 Lisp_Object Vprocess_coding_system_alist;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
389 Lisp_Object Vnetwork_coding_system_alist;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
390
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
391 Lisp_Object Vlocale_coding_system;
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
392
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
393 #endif /* emacs */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
394
22186
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
395 /* Flag to tell if we look up translation table on character code
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
396 conversion. */
22119
592bb8b9bcfd Change terms unify/unification to
Kenichi Handa <handa@m17n.org>
parents: 22020
diff changeset
397 Lisp_Object Venable_character_translation;
22186
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
398 /* Standard translation table to look up on decoding (reading). */
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
399 Lisp_Object Vstandard_translation_table_for_decode;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
400 /* Standard translation table to look up on encoding (writing). */
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
401 Lisp_Object Vstandard_translation_table_for_encode;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
402
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
403 Lisp_Object Qtranslation_table;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
404 Lisp_Object Qtranslation_table_id;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
405 Lisp_Object Qtranslation_table_for_decode;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
406 Lisp_Object Qtranslation_table_for_encode;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
407
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
408 /* Alist of charsets vs revision number. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
409 static Lisp_Object Vcharset_revision_table;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
410
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
411 /* Default coding systems used for process I/O. */
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
412 Lisp_Object Vdefault_process_coding_system;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
413
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
414 /* Char table for translating Quail and self-inserting input. */
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
415 Lisp_Object Vtranslation_table_for_input;
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
416
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
417 /* Two special coding systems. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
418 Lisp_Object Vsjis_coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
419 Lisp_Object Vbig5_coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
420
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
421 /* ISO2022 section */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
422
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
423 #define CODING_ISO_INITIAL(coding, reg) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
424 (XINT (AREF (AREF (CODING_ID_ATTRS ((coding)->id), \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
425 coding_attr_iso_initial), \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
426 reg)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
427
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
428
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
429 #define CODING_ISO_REQUEST(coding, charset_id) \
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
430 (((charset_id) <= (coding)->max_charset_id \
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
431 ? ((coding)->safe_charsets[charset_id] != 255 \
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
432 ? (coding)->safe_charsets[charset_id] \
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
433 : -1) \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
434 : -1))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
435
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
436
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
437 #define CODING_ISO_FLAGS(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
438 ((coding)->spec.iso_2022.flags)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
439 #define CODING_ISO_DESIGNATION(coding, reg) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
440 ((coding)->spec.iso_2022.current_designation[reg])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
441 #define CODING_ISO_INVOCATION(coding, plane) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
442 ((coding)->spec.iso_2022.current_invocation[plane])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
443 #define CODING_ISO_SINGLE_SHIFTING(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
444 ((coding)->spec.iso_2022.single_shifting)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
445 #define CODING_ISO_BOL(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
446 ((coding)->spec.iso_2022.bol)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
447 #define CODING_ISO_INVOKED_CHARSET(coding, plane) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
448 CODING_ISO_DESIGNATION ((coding), CODING_ISO_INVOCATION ((coding), (plane)))
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
449 #define CODING_ISO_CMP_STATUS(coding) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
450 (&(coding)->spec.iso_2022.cmp_status)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
451 #define CODING_ISO_EXTSEGMENT_LEN(coding) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
452 ((coding)->spec.iso_2022.ctext_extended_segment_len)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
453 #define CODING_ISO_EMBEDDED_UTF_8(coding) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
454 ((coding)->spec.iso_2022.embedded_utf_8)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
455
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
456 /* Control characters of ISO2022. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
457 /* code */ /* function */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
458 #define ISO_CODE_LF 0x0A /* line-feed */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
459 #define ISO_CODE_CR 0x0D /* carriage-return */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
460 #define ISO_CODE_SO 0x0E /* shift-out */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
461 #define ISO_CODE_SI 0x0F /* shift-in */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
462 #define ISO_CODE_SS2_7 0x19 /* single-shift-2 for 7-bit code */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
463 #define ISO_CODE_ESC 0x1B /* escape */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
464 #define ISO_CODE_SS2 0x8E /* single-shift-2 */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
465 #define ISO_CODE_SS3 0x8F /* single-shift-3 */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
466 #define ISO_CODE_CSI 0x9B /* control-sequence-introducer */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
467
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
468 /* Each 1-byte code of ISO2022 is classified into one of the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
469 following classes. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
470 enum iso_code_class_type
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
471 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
472 ISO_control_0, /* Control codes in the range
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
473 0x00..0x1F and 0x7F, except for the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
474 following 4 codes. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
475 ISO_shift_out, /* ISO_CODE_SO (0x0E) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
476 ISO_shift_in, /* ISO_CODE_SI (0x0F) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
477 ISO_single_shift_2_7, /* ISO_CODE_SS2_7 (0x19) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
478 ISO_escape, /* ISO_CODE_ESC (0x1B) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
479 ISO_control_1, /* Control codes in the range
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
480 0x80..0x9F, except for the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
481 following 3 codes. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
482 ISO_single_shift_2, /* ISO_CODE_SS2 (0x8E) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
483 ISO_single_shift_3, /* ISO_CODE_SS3 (0x8F) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
484 ISO_control_sequence_introducer, /* ISO_CODE_CSI (0x9B) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
485 ISO_0x20_or_0x7F, /* Codes of the values 0x20 or 0x7F. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
486 ISO_graphic_plane_0, /* Graphic codes in the range 0x21..0x7E. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
487 ISO_0xA0_or_0xFF, /* Codes of the values 0xA0 or 0xFF. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
488 ISO_graphic_plane_1 /* Graphic codes in the range 0xA1..0xFE. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
489 };
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
490
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
491 /** Each macro CODING_ISO_FLAG_XXX defines a flag bit of the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
492 `iso-flags' attribute of an iso2022 coding system. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
493
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
494 /* If set, produce long-form designation sequence (e.g. ESC $ ( A)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
495 instead of the correct short-form sequence (e.g. ESC $ A). */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
496 #define CODING_ISO_FLAG_LONG_FORM 0x0001
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
497
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
498 /* If set, reset graphic planes and registers at end-of-line to the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
499 initial state. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
500 #define CODING_ISO_FLAG_RESET_AT_EOL 0x0002
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
501
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
502 /* If set, reset graphic planes and registers before any control
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
503 characters to the initial state. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
504 #define CODING_ISO_FLAG_RESET_AT_CNTL 0x0004
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
505
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
506 /* If set, encode in a 7-bit environment. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
507 #define CODING_ISO_FLAG_SEVEN_BITS 0x0008
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
508
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
509 /* If set, use locking-shift function. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
510 #define CODING_ISO_FLAG_LOCKING_SHIFT 0x0010
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
511
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
512 /* If set, use single-shift function. Overrides
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
513 CODING_ISO_FLAG_LOCKING_SHIFT. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
514 #define CODING_ISO_FLAG_SINGLE_SHIFT 0x0020
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
515
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
516 /* If set, use designation escape sequence. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
517 #define CODING_ISO_FLAG_DESIGNATION 0x0040
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
518
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
519 /* If set, produce revision number sequence. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
520 #define CODING_ISO_FLAG_REVISION 0x0080
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
521
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
522 /* If set, produce ISO6429's direction specifying sequence. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
523 #define CODING_ISO_FLAG_DIRECTION 0x0100
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
524
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
525 /* If set, assume designation states are reset at beginning of line on
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
526 output. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
527 #define CODING_ISO_FLAG_INIT_AT_BOL 0x0200
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
528
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
529 /* If set, designation sequence should be placed at beginning of line
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
530 on output. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
531 #define CODING_ISO_FLAG_DESIGNATE_AT_BOL 0x0400
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
532
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
533 /* If set, do not encode unsafe characters on output. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
534 #define CODING_ISO_FLAG_SAFE 0x0800
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
535
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
536 /* If set, extra latin codes (128..159) are accepted as a valid code
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
537 on input. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
538 #define CODING_ISO_FLAG_LATIN_EXTRA 0x1000
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
539
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
540 #define CODING_ISO_FLAG_COMPOSITION 0x2000
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
541
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
542 #define CODING_ISO_FLAG_EUC_TW_SHIFT 0x4000
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
543
88681
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
544 #define CODING_ISO_FLAG_USE_ROMAN 0x8000
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
545
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
546 #define CODING_ISO_FLAG_USE_OLDJIS 0x10000
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
547
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
548 #define CODING_ISO_FLAG_FULL_SUPPORT 0x100000
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
549
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
550 /* A character to be produced on output if encoding of the original
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
551 character is prohibited by CODING_ISO_FLAG_SAFE. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
552 #define CODING_INHIBIT_CHARACTER_SUBSTITUTION '?'
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
553
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
554 /* UTF-8 section */
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
555 #define CODING_UTF_8_BOM(coding) \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
556 ((coding)->spec.utf_8_bom)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
557
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
558 /* UTF-16 section */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
559 #define CODING_UTF_16_BOM(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
560 ((coding)->spec.utf_16.bom)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
561
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
562 #define CODING_UTF_16_ENDIAN(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
563 ((coding)->spec.utf_16.endian)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
564
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
565 #define CODING_UTF_16_SURROGATE(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
566 ((coding)->spec.utf_16.surrogate)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
567
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
568
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
569 /* CCL section */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
570 #define CODING_CCL_DECODER(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
571 AREF (CODING_ID_ATTRS ((coding)->id), coding_attr_ccl_decoder)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
572 #define CODING_CCL_ENCODER(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
573 AREF (CODING_ID_ATTRS ((coding)->id), coding_attr_ccl_encoder)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
574 #define CODING_CCL_VALIDS(coding) \
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
575 (SDATA (AREF (CODING_ID_ATTRS ((coding)->id), coding_attr_ccl_valids)))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
576
88771
75c78754826d comments
Dave Love <fx@gnu.org>
parents: 88690
diff changeset
577 /* Index for each coding category in `coding_categories' */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
578
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
579 enum coding_category
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
580 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
581 coding_category_iso_7,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
582 coding_category_iso_7_tight,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
583 coding_category_iso_8_1,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
584 coding_category_iso_8_2,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
585 coding_category_iso_7_else,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
586 coding_category_iso_8_else,
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
587 coding_category_utf_8_auto,
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
588 coding_category_utf_8_nosig,
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
589 coding_category_utf_8_sig,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
590 coding_category_utf_16_auto,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
591 coding_category_utf_16_be,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
592 coding_category_utf_16_le,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
593 coding_category_utf_16_be_nosig,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
594 coding_category_utf_16_le_nosig,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
595 coding_category_charset,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
596 coding_category_sjis,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
597 coding_category_big5,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
598 coding_category_ccl,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
599 coding_category_emacs_mule,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
600 /* All above are targets of code detection. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
601 coding_category_raw_text,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
602 coding_category_undecided,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
603 coding_category_max
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
604 };
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
605
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
606 /* Definitions of flag bits used in detect_coding_XXXX. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
607 #define CATEGORY_MASK_ISO_7 (1 << coding_category_iso_7)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
608 #define CATEGORY_MASK_ISO_7_TIGHT (1 << coding_category_iso_7_tight)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
609 #define CATEGORY_MASK_ISO_8_1 (1 << coding_category_iso_8_1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
610 #define CATEGORY_MASK_ISO_8_2 (1 << coding_category_iso_8_2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
611 #define CATEGORY_MASK_ISO_7_ELSE (1 << coding_category_iso_7_else)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
612 #define CATEGORY_MASK_ISO_8_ELSE (1 << coding_category_iso_8_else)
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
613 #define CATEGORY_MASK_UTF_8_AUTO (1 << coding_category_utf_8_auto)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
614 #define CATEGORY_MASK_UTF_8_NOSIG (1 << coding_category_utf_8_nosig)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
615 #define CATEGORY_MASK_UTF_8_SIG (1 << coding_category_utf_8_sig)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
616 #define CATEGORY_MASK_UTF_16_AUTO (1 << coding_category_utf_16_auto)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
617 #define CATEGORY_MASK_UTF_16_BE (1 << coding_category_utf_16_be)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
618 #define CATEGORY_MASK_UTF_16_LE (1 << coding_category_utf_16_le)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
619 #define CATEGORY_MASK_UTF_16_BE_NOSIG (1 << coding_category_utf_16_be_nosig)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
620 #define CATEGORY_MASK_UTF_16_LE_NOSIG (1 << coding_category_utf_16_le_nosig)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
621 #define CATEGORY_MASK_CHARSET (1 << coding_category_charset)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
622 #define CATEGORY_MASK_SJIS (1 << coding_category_sjis)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
623 #define CATEGORY_MASK_BIG5 (1 << coding_category_big5)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
624 #define CATEGORY_MASK_CCL (1 << coding_category_ccl)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
625 #define CATEGORY_MASK_EMACS_MULE (1 << coding_category_emacs_mule)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
626 #define CATEGORY_MASK_RAW_TEXT (1 << coding_category_raw_text)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
627
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
628 /* This value is returned if detect_coding_mask () finds nothing other
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
629 than ASCII characters. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
630 #define CATEGORY_MASK_ANY \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
631 (CATEGORY_MASK_ISO_7 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
632 | CATEGORY_MASK_ISO_7_TIGHT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
633 | CATEGORY_MASK_ISO_8_1 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
634 | CATEGORY_MASK_ISO_8_2 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
635 | CATEGORY_MASK_ISO_7_ELSE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
636 | CATEGORY_MASK_ISO_8_ELSE \
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
637 | CATEGORY_MASK_UTF_8_AUTO \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
638 | CATEGORY_MASK_UTF_8_NOSIG \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
639 | CATEGORY_MASK_UTF_8_SIG \
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
640 | CATEGORY_MASK_UTF_16_AUTO \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
641 | CATEGORY_MASK_UTF_16_BE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
642 | CATEGORY_MASK_UTF_16_LE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
643 | CATEGORY_MASK_UTF_16_BE_NOSIG \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
644 | CATEGORY_MASK_UTF_16_LE_NOSIG \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
645 | CATEGORY_MASK_CHARSET \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
646 | CATEGORY_MASK_SJIS \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
647 | CATEGORY_MASK_BIG5 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
648 | CATEGORY_MASK_CCL \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
649 | CATEGORY_MASK_EMACS_MULE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
650
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
651
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
652 #define CATEGORY_MASK_ISO_7BIT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
653 (CATEGORY_MASK_ISO_7 | CATEGORY_MASK_ISO_7_TIGHT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
654
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
655 #define CATEGORY_MASK_ISO_8BIT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
656 (CATEGORY_MASK_ISO_8_1 | CATEGORY_MASK_ISO_8_2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
657
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
658 #define CATEGORY_MASK_ISO_ELSE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
659 (CATEGORY_MASK_ISO_7_ELSE | CATEGORY_MASK_ISO_8_ELSE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
660
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
661 #define CATEGORY_MASK_ISO_ESCAPE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
662 (CATEGORY_MASK_ISO_7 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
663 | CATEGORY_MASK_ISO_7_TIGHT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
664 | CATEGORY_MASK_ISO_7_ELSE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
665 | CATEGORY_MASK_ISO_8_ELSE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
666
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
667 #define CATEGORY_MASK_ISO \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
668 ( CATEGORY_MASK_ISO_7BIT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
669 | CATEGORY_MASK_ISO_8BIT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
670 | CATEGORY_MASK_ISO_ELSE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
671
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
672 #define CATEGORY_MASK_UTF_16 \
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
673 (CATEGORY_MASK_UTF_16_AUTO \
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
674 | CATEGORY_MASK_UTF_16_BE \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
675 | CATEGORY_MASK_UTF_16_LE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
676 | CATEGORY_MASK_UTF_16_BE_NOSIG \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
677 | CATEGORY_MASK_UTF_16_LE_NOSIG)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
678
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
679 #define CATEGORY_MASK_UTF_8 \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
680 (CATEGORY_MASK_UTF_8_AUTO \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
681 | CATEGORY_MASK_UTF_8_NOSIG \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
682 | CATEGORY_MASK_UTF_8_SIG)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
683
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
684 /* List of symbols `coding-category-xxx' ordered by priority. This
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
685 variable is exposed to Emacs Lisp. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
686 static Lisp_Object Vcoding_category_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
687
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
688 /* Table of coding categories (Lisp symbols). This variable is for
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
689 internal use only. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
690 static Lisp_Object Vcoding_category_table;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
691
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
692 /* Table of coding-categories ordered by priority. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
693 static enum coding_category coding_priorities[coding_category_max];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
694
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
695 /* Nth element is a coding context for the coding system bound to the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
696 Nth coding category. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
697 static struct coding_system coding_categories[coding_category_max];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
698
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
699 /*** Commonly used macros and functions ***/
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
700
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
701 #ifndef min
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
702 #define min(a, b) ((a) < (b) ? (a) : (b))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
703 #endif
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
704 #ifndef max
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
705 #define max(a, b) ((a) > (b) ? (a) : (b))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
706 #endif
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
707
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
708 #define CODING_GET_INFO(coding, attrs, charset_list) \
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
709 do { \
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
710 (attrs) = CODING_ID_ATTRS ((coding)->id); \
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
711 (charset_list) = CODING_ATTR_CHARSET_LIST (attrs); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
712 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
713
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
714
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
715 /* Safely get one byte from the source text pointed to by SRC which ends
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
716 at SRC_END, and set C to that byte. If there are not enough bytes
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
717 in the source, it jumps to `no_more_source'. If multibytep is
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
718 nonzero, and a multibyte character is found at SRC, set C to the
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
719 negative value of the character code. The caller should declare
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
720 and set these variables appropriately in advance:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
721 src, src_end, multibytep */
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
722
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
723 #define ONE_MORE_BYTE(c) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
724 do { \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
725 if (src == src_end) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
726 { \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
727 if (src_base < src) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
728 record_conversion_result \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
729 (coding, CODING_RESULT_INSUFFICIENT_SRC); \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
730 goto no_more_source; \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
731 } \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
732 c = *src++; \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
733 if (multibytep && (c & 0x80)) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
734 { \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
735 if ((c & 0xFE) == 0xC0) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
736 c = ((c & 1) << 6) | *src++; \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
737 else \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
738 { \
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
739 src--; \
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
740 c = - string_char (src, &src, NULL); \
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
741 record_conversion_result \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
742 (coding, CODING_RESULT_INVALID_SRC); \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
743 } \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
744 } \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
745 consumed_chars++; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
746 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
747
101172
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
748 /* Safely get two bytes from the source text pointed to by SRC which ends
101174
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
749 at SRC_END, and set C1 and C2 to those bytes while skipping the
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
750 heading multibyte characters. If there are not enough bytes in the
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
751 source, it jumps to `no_more_source'. If multibytep is nonzero and
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
752 a multibyte character is found for C2 whose leading byte is not 0xC0
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
753 or 0xC1, set C2 to -1. The caller should declare and set these
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
754 variables appropriately in advance:
101172
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
755 src, src_end, multibytep
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
756 It is intended that this macro is used in detect_coding_utf_16. */
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
757
101174
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
758 #define TWO_MORE_BYTES(c1, c2) \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
759 do { \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
760 do { \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
761 if (src == src_end) \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
762 goto no_more_source; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
763 c1 = *src++; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
764 if (multibytep && (c1 & 0x80)) \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
765 { \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
766 if ((c1 & 0xFE) == 0xC0) \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
767 c1 = ((c1 & 1) << 6) | *src++; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
768 else \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
769 { \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
770 src += BYTES_BY_CHAR_HEAD (c1) - 1; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
771 c1 = -1; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
772 } \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
773 } \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
774 } while (c1 < 0); \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
775 if (src == src_end) \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
776 goto no_more_source; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
777 c2 = *src++; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
778 if (multibytep && (c2 & 0x80)) \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
779 { \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
780 if ((c2 & 0xFE) == 0xC0) \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
781 c2 = ((c2 & 1) << 6) | *src++; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
782 else \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
783 c2 = -1; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
784 } \
101172
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
785 } while (0)
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
786
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
787
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
788 #define ONE_MORE_BYTE_NO_CHECK(c) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
789 do { \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
790 c = *src++; \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
791 if (multibytep && (c & 0x80)) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
792 { \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
793 if ((c & 0xFE) == 0xC0) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
794 c = ((c & 1) << 6) | *src++; \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
795 else \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
796 { \
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
797 src--; \
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
798 c = - string_char (src, &src, NULL); \
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
799 record_conversion_result \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
800 (coding, CODING_RESULT_INVALID_SRC); \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
801 } \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
802 } \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
803 consumed_chars++; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
804 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
805
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
806
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
807 /* Store a byte C in the place pointed to by DST and increment DST to the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
808 next free point, and increment PRODUCED_CHARS. The caller should
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
809 ensure that C is 0..127, and declare and set the variable `dst'
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
810 appropriately in advance.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
811 */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
812
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
813
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
814 #define EMIT_ONE_ASCII_BYTE(c) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
815 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
816 produced_chars++; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
817 *dst++ = (c); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
818 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
819
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
820
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
821 /* Like EMIT_ONE_ASCII_BYTE but store two bytes; C1 and C2. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
822
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
823 #define EMIT_TWO_ASCII_BYTES(c1, c2) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
824 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
825 produced_chars += 2; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
826 *dst++ = (c1), *dst++ = (c2); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
827 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
828
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
829
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
830 /* Store a byte C in the place pointed to by DST and increment DST to the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
831 next free point, and increment PRODUCED_CHARS. If MULTIBYTEP is
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
832 nonzero, store in an appropriate multibyte form. The caller should
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
833 declare and set the variables `dst' and `multibytep' appropriately
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
834 in advance. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
835
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
836 #define EMIT_ONE_BYTE(c) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
837 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
838 produced_chars++; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
839 if (multibytep) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
840 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
841 int ch = (c); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
842 if (ch >= 0x80) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
843 ch = BYTE8_TO_CHAR (ch); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
844 CHAR_STRING_ADVANCE (ch, dst); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
845 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
846 else \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
847 *dst++ = (c); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
848 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
849
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
850
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
851 /* Like EMIT_ONE_BYTE, but emit two bytes; C1 and C2. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
852
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
853 #define EMIT_TWO_BYTES(c1, c2) \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
854 do { \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
855 produced_chars += 2; \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
856 if (multibytep) \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
857 { \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
858 int ch; \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
859 \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
860 ch = (c1); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
861 if (ch >= 0x80) \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
862 ch = BYTE8_TO_CHAR (ch); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
863 CHAR_STRING_ADVANCE (ch, dst); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
864 ch = (c2); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
865 if (ch >= 0x80) \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
866 ch = BYTE8_TO_CHAR (ch); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
867 CHAR_STRING_ADVANCE (ch, dst); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
868 } \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
869 else \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
870 { \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
871 *dst++ = (c1); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
872 *dst++ = (c2); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
873 } \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
874 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
875
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
876
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
877 #define EMIT_THREE_BYTES(c1, c2, c3) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
878 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
879 EMIT_ONE_BYTE (c1); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
880 EMIT_TWO_BYTES (c2, c3); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
881 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
882
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
883
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
884 #define EMIT_FOUR_BYTES(c1, c2, c3, c4) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
885 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
886 EMIT_TWO_BYTES (c1, c2); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
887 EMIT_TWO_BYTES (c3, c4); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
888 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
889
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
890
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
891 /* Prototypes for static functions. */
109100
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
892 static void record_conversion_result (struct coding_system *coding,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
893 enum coding_result_code result);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
894 static int detect_coding_utf_8 (struct coding_system *,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
895 struct coding_detection_info *info);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
896 static void decode_coding_utf_8 (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
897 static int encode_coding_utf_8 (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
898
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
899 static int detect_coding_utf_16 (struct coding_system *,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
900 struct coding_detection_info *info);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
901 static void decode_coding_utf_16 (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
902 static int encode_coding_utf_16 (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
903
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
904 static int detect_coding_iso_2022 (struct coding_system *,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
905 struct coding_detection_info *info);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
906 static void decode_coding_iso_2022 (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
907 static int encode_coding_iso_2022 (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
908
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
909 static int detect_coding_emacs_mule (struct coding_system *,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
910 struct coding_detection_info *info);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
911 static void decode_coding_emacs_mule (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
912 static int encode_coding_emacs_mule (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
913
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
914 static int detect_coding_sjis (struct coding_system *,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
915 struct coding_detection_info *info);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
916 static void decode_coding_sjis (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
917 static int encode_coding_sjis (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
918
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
919 static int detect_coding_big5 (struct coding_system *,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
920 struct coding_detection_info *info);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
921 static void decode_coding_big5 (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
922 static int encode_coding_big5 (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
923
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
924 static int detect_coding_ccl (struct coding_system *,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
925 struct coding_detection_info *info);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
926 static void decode_coding_ccl (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
927 static int encode_coding_ccl (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
928
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
929 static void decode_coding_raw_text (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
930 static int encode_coding_raw_text (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
931
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
932 static void coding_set_source (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
933 static void coding_set_destination (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
934 static void coding_alloc_by_realloc (struct coding_system *, EMACS_INT);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
935 static void coding_alloc_by_making_gap (struct coding_system *,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
936 EMACS_INT, EMACS_INT);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
937 static unsigned char *alloc_destination (struct coding_system *,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
938 EMACS_INT, unsigned char *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
939 static void setup_iso_safe_charsets (Lisp_Object);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
940 static unsigned char *encode_designation_at_bol (struct coding_system *,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
941 int *, int *,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
942 unsigned char *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
943 static int detect_eol (const unsigned char *,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
944 EMACS_INT, enum coding_category);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
945 static Lisp_Object adjust_coding_eol_type (struct coding_system *, int);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
946 static void decode_eol (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
947 static Lisp_Object get_translation_table (Lisp_Object, int, int *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
948 static Lisp_Object get_translation (Lisp_Object, int *, int *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
949 static int produce_chars (struct coding_system *, Lisp_Object, int);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
950 static INLINE void produce_charset (struct coding_system *, int *,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
951 EMACS_INT);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
952 static void produce_annotation (struct coding_system *, EMACS_INT);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
953 static int decode_coding (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
954 static INLINE int *handle_composition_annotation (EMACS_INT, EMACS_INT,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
955 struct coding_system *,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
956 int *, EMACS_INT *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
957 static INLINE int *handle_charset_annotation (EMACS_INT, EMACS_INT,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
958 struct coding_system *,
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
959 int *, EMACS_INT *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
960 static void consume_chars (struct coding_system *, Lisp_Object, int);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
961 static int encode_coding (struct coding_system *);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
962 static Lisp_Object make_conversion_work_buffer (int);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
963 static Lisp_Object code_conversion_restore (Lisp_Object);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
964 static INLINE int char_encodable_p (int, Lisp_Object);
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
965 static Lisp_Object make_subsidiaries (Lisp_Object);
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
966
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
967 static void
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
968 record_conversion_result (struct coding_system *coding,
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
969 enum coding_result_code result)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
970 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
971 coding->result = result;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
972 switch (result)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
973 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
974 case CODING_RESULT_INSUFFICIENT_SRC:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
975 Vlast_code_conversion_error = Qinsufficient_source;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
976 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
977 case CODING_RESULT_INCONSISTENT_EOL:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
978 Vlast_code_conversion_error = Qinconsistent_eol;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
979 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
980 case CODING_RESULT_INVALID_SRC:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
981 Vlast_code_conversion_error = Qinvalid_source;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
982 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
983 case CODING_RESULT_INTERRUPT:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
984 Vlast_code_conversion_error = Qinterrupted;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
985 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
986 case CODING_RESULT_INSUFFICIENT_MEM:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
987 Vlast_code_conversion_error = Qinsufficient_memory;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
988 break;
107174
e98bd64897e0 Fix handling of CODING_RESULT_INSUFFICIENT_DST.
Kenichi Handa <handa@m17n.org>
parents: 107171
diff changeset
989 case CODING_RESULT_INSUFFICIENT_DST:
e98bd64897e0 Fix handling of CODING_RESULT_INSUFFICIENT_DST.
Kenichi Handa <handa@m17n.org>
parents: 107171
diff changeset
990 /* Don't record this error in Vlast_code_conversion_error
e98bd64897e0 Fix handling of CODING_RESULT_INSUFFICIENT_DST.
Kenichi Handa <handa@m17n.org>
parents: 107171
diff changeset
991 because it happens just temporarily and is resolved when the
e98bd64897e0 Fix handling of CODING_RESULT_INSUFFICIENT_DST.
Kenichi Handa <handa@m17n.org>
parents: 107171
diff changeset
992 whole conversion is finished. */
e98bd64897e0 Fix handling of CODING_RESULT_INSUFFICIENT_DST.
Kenichi Handa <handa@m17n.org>
parents: 107171
diff changeset
993 break;
103133
2f7395806731 (record_conversion_result): Don't modify
Andreas Schwab <schwab@linux-m68k.org>
parents: 103052
diff changeset
994 case CODING_RESULT_SUCCESS:
2f7395806731 (record_conversion_result): Don't modify
Andreas Schwab <schwab@linux-m68k.org>
parents: 103052
diff changeset
995 break;
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
996 default:
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
997 Vlast_code_conversion_error = intern ("Unknown error");
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
998 }
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
999 }
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1000
107321
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
1001 /* This wrapper macro is used to preserve validity of pointers into
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
1002 buffer text across calls to decode_char, which could cause
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
1003 relocation of buffers if it loads a charset map, because loading a
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
1004 charset map allocates large structures. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1005 #define CODING_DECODE_CHAR(coding, src, src_base, src_end, charset, code, c) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1006 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1007 charset_map_loaded = 0; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1008 c = DECODE_CHAR (charset, code); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1009 if (charset_map_loaded) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1010 { \
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1011 const unsigned char *orig = coding->source; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1012 EMACS_INT offset; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1013 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1014 coding_set_source (coding); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1015 offset = coding->source - orig; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1016 src += offset; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1017 src_base += offset; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1018 src_end += offset; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1019 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1020 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1021
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1022
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1023 /* Unless more than BYTES bytes of room remain at dst, allocate memory
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1024 for coding->destination and update dst and dst_end. We don't have
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1025 to take care of coding->source which will be relocated. It is
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1026 handled by calling coding_set_source in encode_coding. */
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1027
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1028 #define ASSURE_DESTINATION(bytes) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1029 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1030 if (dst + (bytes) >= dst_end) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1031 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1032 int more_bytes = charbuf_end - charbuf + (bytes); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1033 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1034 dst = alloc_destination (coding, more_bytes, dst); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1035 dst_end = coding->destination + coding->dst_bytes; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1036 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1037 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1038
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1039
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1040 /* Store the multibyte form of the character C in P, and advance P to the
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1041 end of the multibyte form. This is like CHAR_STRING_ADVANCE but it
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1042 never calls MAYBE_UNIFY_CHAR. */
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1043
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1044 #define CHAR_STRING_ADVANCE_NO_UNIFY(c, p) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1045 do { \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1046 if ((c) <= MAX_1_BYTE_CHAR) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1047 *(p)++ = (c); \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1048 else if ((c) <= MAX_2_BYTE_CHAR) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1049 *(p)++ = (0xC0 | ((c) >> 6)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1050 *(p)++ = (0x80 | ((c) & 0x3F)); \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1051 else if ((c) <= MAX_3_BYTE_CHAR) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1052 *(p)++ = (0xE0 | ((c) >> 12)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1053 *(p)++ = (0x80 | (((c) >> 6) & 0x3F)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1054 *(p)++ = (0x80 | ((c) & 0x3F)); \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1055 else if ((c) <= MAX_4_BYTE_CHAR) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1056 *(p)++ = (0xF0 | (c >> 18)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1057 *(p)++ = (0x80 | ((c >> 12) & 0x3F)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1058 *(p)++ = (0x80 | ((c >> 6) & 0x3F)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1059 *(p)++ = (0x80 | (c & 0x3F)); \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1060 else if ((c) <= MAX_5_BYTE_CHAR) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1061 *(p)++ = 0xF8, \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1062 *(p)++ = (0x80 | ((c >> 18) & 0x0F)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1063 *(p)++ = (0x80 | ((c >> 12) & 0x3F)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1064 *(p)++ = (0x80 | ((c >> 6) & 0x3F)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1065 *(p)++ = (0x80 | (c & 0x3F)); \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1066 else \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1067 (p) += BYTE8_STRING ((c) - 0x3FFF80, p); \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1068 } while (0)
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1069
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1070
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1071 /* Return the character code of the character whose multibyte form is at
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1072 P, and advance P to the end of the multibyte form. This is like
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1073 STRING_CHAR_ADVANCE, but it never calls MAYBE_UNIFY_CHAR. */
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1074
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1075 #define STRING_CHAR_ADVANCE_NO_UNIFY(p) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1076 (!((p)[0] & 0x80) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1077 ? *(p)++ \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1078 : ! ((p)[0] & 0x20) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1079 ? ((p) += 2, \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1080 ((((p)[-2] & 0x1F) << 6) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1081 | ((p)[-1] & 0x3F) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1082 | ((unsigned char) ((p)[-2]) < 0xC2 ? 0x3FFF80 : 0))) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1083 : ! ((p)[0] & 0x10) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1084 ? ((p) += 3, \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1085 ((((p)[-3] & 0x0F) << 12) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1086 | (((p)[-2] & 0x3F) << 6) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1087 | ((p)[-1] & 0x3F))) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1088 : ! ((p)[0] & 0x08) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1089 ? ((p) += 4, \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1090 ((((p)[-4] & 0xF) << 18) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1091 | (((p)[-3] & 0x3F) << 12) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1092 | (((p)[-2] & 0x3F) << 6) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1093 | ((p)[-1] & 0x3F))) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1094 : ((p) += 5, \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1095 ((((p)[-4] & 0x3F) << 18) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1096 | (((p)[-3] & 0x3F) << 12) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1097 | (((p)[-2] & 0x3F) << 6) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1098 | ((p)[-1] & 0x3F))))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1099
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1100
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1101 static void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
1102 coding_set_source (struct coding_system *coding)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1103 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1104 if (BUFFERP (coding->src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1105 {
89418
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
1106 struct buffer *buf = XBUFFER (coding->src_object);
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
1107
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1108 if (coding->src_pos < 0)
89418
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
1109 coding->source = BUF_GAP_END_ADDR (buf) + coding->src_pos_byte;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1110 else
89418
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
1111 coding->source = BUF_BYTE_ADDRESS (buf, coding->src_pos_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1112 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1113 else if (STRINGP (coding->src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1114 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1115 coding->source = SDATA (coding->src_object) + coding->src_pos_byte;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1116 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1117 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1118 /* Otherwise, the source is a C string and is never relocated
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1119 automatically. Thus we don't have to update anything. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1120 ;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1121 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1122
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1123 static void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
1124 coding_set_destination (struct coding_system *coding)
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1125 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1126 if (BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1127 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1128 if (coding->src_pos < 0)
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1129 {
91807
507bcfb4342c * coding.c (coding_set_destination): Use BEG_BYTE rather than hardcoding 1.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 91622
diff changeset
1130 coding->destination = BEG_ADDR + coding->dst_pos_byte - BEG_BYTE;
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1131 coding->dst_bytes = (GAP_END_ADDR
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1132 - (coding->src_bytes - coding->consumed)
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1133 - coding->destination);
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1134 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1135 else
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1136 {
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1137 /* We are sure that coding->dst_pos_byte is before the gap
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1138 of the buffer. */
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1139 coding->destination = (BUF_BEG_ADDR (XBUFFER (coding->dst_object))
91807
507bcfb4342c * coding.c (coding_set_destination): Use BEG_BYTE rather than hardcoding 1.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 91622
diff changeset
1140 + coding->dst_pos_byte - BEG_BYTE);
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1141 coding->dst_bytes = (BUF_GAP_END_ADDR (XBUFFER (coding->dst_object))
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1142 - coding->destination);
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1143 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1144 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1145 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1146 /* Otherwise, the destination is C string and is never relocated
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1147 automatically. Thus we don't have to update anything. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1148 ;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1149 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1150
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1151
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1152 static void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
1153 coding_alloc_by_realloc (struct coding_system *coding, EMACS_INT bytes)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1154 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1155 coding->destination = (unsigned char *) xrealloc (coding->destination,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1156 coding->dst_bytes + bytes);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1157 coding->dst_bytes += bytes;
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1158 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1159
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1160 static void
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
1161 coding_alloc_by_making_gap (struct coding_system *coding,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
1162 EMACS_INT gap_head_used, EMACS_INT bytes)
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1163 {
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1164 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1165 {
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1166 /* The gap may contain the produced data at the head and not-yet
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1167 consumed data at the tail. To preserve those data, we at
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1168 first make the gap size to zero, then increase the gap
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1169 size. */
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1170 EMACS_INT add = GAP_SIZE;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1171
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1172 GPT += gap_head_used, GPT_BYTE += gap_head_used;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1173 GAP_SIZE = 0; ZV += add; Z += add; ZV_BYTE += add; Z_BYTE += add;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1174 make_gap (bytes);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1175 GAP_SIZE += add; ZV -= add; Z -= add; ZV_BYTE -= add; Z_BYTE -= add;
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1176 GPT -= gap_head_used, GPT_BYTE -= gap_head_used;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1177 }
90292
697c08d95af7 Cancel incorrect synching with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90291
diff changeset
1178 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1179 {
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
1180 Lisp_Object this_buffer;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
1181
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
1182 this_buffer = Fcurrent_buffer ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1183 set_buffer_internal (XBUFFER (coding->dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1184 make_gap (bytes);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1185 set_buffer_internal (XBUFFER (this_buffer));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1186 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1187 }
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1188
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1189
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1190 static unsigned char *
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
1191 alloc_destination (struct coding_system *coding, EMACS_INT nbytes,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
1192 unsigned char *dst)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1193 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1194 EMACS_INT offset = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1195
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1196 if (BUFFERP (coding->dst_object))
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1197 {
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1198 struct buffer *buf = XBUFFER (coding->dst_object);
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1199
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1200 coding_alloc_by_making_gap (coding, dst - BUF_GPT_ADDR (buf), nbytes);
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1201 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1202 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1203 coding_alloc_by_realloc (coding, nbytes);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1204 coding_set_destination (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1205 dst = coding->destination + offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1206 return dst;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1207 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1208
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1209 /** Macros for annotations. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1210
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1211 /* Annotation data is stored in the array coding->charbuf in this
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1212 format:
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1213 [ -LENGTH ANNOTATION_MASK NCHARS ... ]
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1214 LENGTH is the number of elements in the annotation.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1215 ANNOTATION_MASK is one of CODING_ANNOTATE_XXX_MASK.
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1216 NCHARS is the number of characters in the text annotated.
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1217
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1218 The format of the following elements depends on ANNOTATION_MASK.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1219
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1220 In the case of CODING_ANNOTATE_COMPOSITION_MASK, these elements
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1221 follow:
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1222 ... NBYTES METHOD [ COMPOSITION-COMPONENTS ... ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1223
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1224 NBYTES is the number of bytes specified in the header part of
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1225 old-style emacs-mule encoding, or 0 for the other kind of
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1226 composition.
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1227
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1228 METHOD is one of enum composition_method.
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1229
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
1230 Optional COMPOSITION-COMPONENTS are characters and composition
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1231 rules.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1232
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1233 In the case of CODING_ANNOTATE_CHARSET_MASK, one element CHARSET-ID
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1234 follows.
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1235
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1236 If ANNOTATION_MASK is 0, this annotation is just a space holder to
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1237 recover from an invalid annotation, and should be skipped by
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1238 produce_annotation. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1239
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
/* Maximum length of the header of annotation data.  */
#define MAX_ANNOTATION_LENGTH 5

/* Store the annotation header [ -LEN MASK NCHARS ] at BUF, advance BUF
   past those three elements, and set coding->annotated.

   BUF must be a modifiable pointer lvalue; it is evaluated three
   times.  A variable named `coding' must be in scope where the macro
   is used.  The expansion has no trailing semicolon, so that an
   invocation followed by `;' is exactly one statement and can be
   used, for instance, as the body of an `if' that has an `else'.  */
#define ADD_ANNOTATION_DATA(buf, len, mask, nchars)     \
  do {                                                  \
    *(buf)++ = -(len);                                  \
    *(buf)++ = (mask);                                  \
    *(buf)++ = (nchars);                                \
    coding->annotated = 1;                              \
  } while (0)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1250
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
/* Store the header of a composition annotation at BUF and advance BUF
   past it.  Five elements are written: the three common ones (length
   -5, CODING_ANNOTATE_COMPOSITION_MASK, NCHARS) via
   ADD_ANNOTATION_DATA, followed by NBYTES and METHOD.

   BUF must be a modifiable pointer lvalue and is evaluated several
   times.  Every parameter is parenthesized so that an argument such
   as `*pp' advances the same object in all five stores.  */
#define ADD_COMPOSITION_DATA(buf, nchars, nbytes, method)                   \
  do {                                                                      \
    ADD_ANNOTATION_DATA (buf, 5, CODING_ANNOTATE_COMPOSITION_MASK, nchars); \
    *(buf)++ = (nbytes);                                                    \
    *(buf)++ = (method);                                                    \
  } while (0)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1257
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1258
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
/* Store a charset annotation at BUF and advance BUF past it.  Four
   elements are written: the three common ones (length -4,
   CODING_ANNOTATE_CHARSET_MASK, NCHARS) via ADD_ANNOTATION_DATA,
   followed by the charset ID.

   BUF must be a modifiable pointer lvalue and is evaluated several
   times.  Every parameter is parenthesized so that an argument such
   as `*pp' advances the same object in all four stores.  */
#define ADD_CHARSET_DATA(buf, nchars, id)                               \
  do {                                                                  \
    ADD_ANNOTATION_DATA (buf, 4, CODING_ANNOTATE_CHARSET_MASK, nchars); \
    *(buf)++ = (id);                                                    \
  } while (0)
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1264
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1265
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1266 /*** 2. Emacs' internal format (emacs-utf-8) ***/
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1267
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1268
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1269
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1270
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1271 /*** 3. UTF-8 ***/
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1272
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1273 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1274 Check if a text is encoded in UTF-8. If it is, return 1, else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1275 return 0. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1276
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Predicates classifying one octet C of a UTF-8 byte sequence by its
   high bits.  */

/* C is below 0x80: a character encoded in a single octet.  */
#define UTF_8_1_OCTET_P(c)              ((c) < 0x80)
/* C has the form 10xxxxxx: a trailing octet.  */
#define UTF_8_EXTRA_OCTET_P(c)          (((c) & 0xC0) == 0x80)
/* C has the form 110xxxxx: leading octet of a 2-octet sequence.  */
#define UTF_8_2_OCTET_LEADING_P(c)      (((c) & 0xE0) == 0xC0)
/* C has the form 1110xxxx: leading octet of a 3-octet sequence.  */
#define UTF_8_3_OCTET_LEADING_P(c)      (((c) & 0xF0) == 0xE0)
/* C has the form 11110xxx: leading octet of a 4-octet sequence.  */
#define UTF_8_4_OCTET_LEADING_P(c)      (((c) & 0xF8) == 0xF0)
/* C has the form 111110xx: leading octet of a 5-octet sequence.  */
#define UTF_8_5_OCTET_LEADING_P(c)      (((c) & 0xFC) == 0xF8)

/* The byte order mark character, and the three octets that encode it
   in UTF-8.  */
#define UTF_BOM         0xFEFF
#define UTF_8_BOM_1     0xEF
#define UTF_8_BOM_2     0xBB
#define UTF_8_BOM_3     0xBF
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1288
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1289 static int
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
1290 detect_coding_utf_8 (struct coding_system *coding,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
1291 struct coding_detection_info *detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1292 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1293 const unsigned char *src = coding->source, *src_base;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1294 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1295 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1296 int consumed_chars = 0;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1297 int bom_found = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1298 int found = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1299
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1300 detect_info->checked |= CATEGORY_MASK_UTF_8;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1301 /* A coding system of this category is always ASCII compatible. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1302 src += coding->head_ascii;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1303
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1304 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1305 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1306 int c, c1, c2, c3, c4;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1307
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1308 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1309 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1310 if (c < 0 || UTF_8_1_OCTET_P (c))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1311 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1312 ONE_MORE_BYTE (c1);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1313 if (c1 < 0 || ! UTF_8_EXTRA_OCTET_P (c1))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1314 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1315 if (UTF_8_2_OCTET_LEADING_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1316 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1317 found = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1318 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1319 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1320 ONE_MORE_BYTE (c2);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1321 if (c2 < 0 || ! UTF_8_EXTRA_OCTET_P (c2))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1322 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1323 if (UTF_8_3_OCTET_LEADING_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1324 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1325 found = 1;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1326 if (src_base == coding->source
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1327 && c == UTF_8_BOM_1 && c1 == UTF_8_BOM_2 && c2 == UTF_8_BOM_3)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1328 bom_found = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1329 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1330 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1331 ONE_MORE_BYTE (c3);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1332 if (c3 < 0 || ! UTF_8_EXTRA_OCTET_P (c3))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1333 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1334 if (UTF_8_4_OCTET_LEADING_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1335 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1336 found = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1337 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1338 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1339 ONE_MORE_BYTE (c4);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1340 if (c4 < 0 || ! UTF_8_EXTRA_OCTET_P (c4))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1341 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1342 if (UTF_8_5_OCTET_LEADING_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1343 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1344 found = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1345 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1346 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1347 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1348 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1349 detect_info->rejected |= CATEGORY_MASK_UTF_8;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1350 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1351
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1352 no_more_source:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1353 if (src_base < src && coding->mode & CODING_MODE_LAST_BLOCK)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
1354 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1355 detect_info->rejected |= CATEGORY_MASK_UTF_8;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
1356 return 0;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
1357 }
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1358 if (bom_found)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1359 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1360 /* The first character 0xFFFE doesn't necessarily mean a BOM. */
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1361 detect_info->found |= CATEGORY_MASK_UTF_8_SIG | CATEGORY_MASK_UTF_8_NOSIG;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1362 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1363 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1364 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1365 detect_info->rejected |= CATEGORY_MASK_UTF_8_SIG;
96571
a3f2a5a4b492 (detect_coding_utf_8): Set detect_info->found only when
Kenichi Handa <handa@m17n.org>
parents: 95585
diff changeset
1366 if (found)
a3f2a5a4b492 (detect_coding_utf_8): Set detect_info->found only when
Kenichi Handa <handa@m17n.org>
parents: 95585
diff changeset
1367 detect_info->found |= CATEGORY_MASK_UTF_8_NOSIG;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1368 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1369 return 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1370 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1371
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1372
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1373 static void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
1374 decode_coding_utf_8 (struct coding_system *coding)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1375 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1376 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1377 const unsigned char *src_end = coding->source + coding->src_bytes;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1378 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1379 int *charbuf = coding->charbuf + coding->charbuf_used;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1380 int *charbuf_end = coding->charbuf + coding->charbuf_size;
100133
bca35d7cb3ac (decode_coding_utf_8): Likewise.
Kenichi Handa <handa@m17n.org>
parents: 100131
diff changeset
1381 int consumed_chars = 0, consumed_chars_base = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1382 int multibytep = coding->src_multibyte;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1383 enum utf_bom_type bom = CODING_UTF_8_BOM (coding);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1384 Lisp_Object attr, charset_list;
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
1385 int eol_crlf =
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
1386 !inhibit_eol_conversion && EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1387 int byte_after_cr = -1;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1388
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1389 CODING_GET_INFO (coding, attr, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1390
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1391 if (bom != utf_without_bom)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1392 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1393 int c1, c2, c3;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1394
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1395 src_base = src;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1396 ONE_MORE_BYTE (c1);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1397 if (! UTF_8_3_OCTET_LEADING_P (c1))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1398 src = src_base;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1399 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1400 {
99074
10cd979d05ca (make_conversion_work_buffer): Check that Vcode_conversion_reused_workbuf
Noah Friedman <friedman@splode.com>
parents: 98992
diff changeset
1401 ONE_MORE_BYTE (c2);
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1402 if (! UTF_8_EXTRA_OCTET_P (c2))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1403 src = src_base;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1404 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1405 {
99074
10cd979d05ca (make_conversion_work_buffer): Check that Vcode_conversion_reused_workbuf
Noah Friedman <friedman@splode.com>
parents: 98992
diff changeset
1406 ONE_MORE_BYTE (c3);
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1407 if (! UTF_8_EXTRA_OCTET_P (c3))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1408 src = src_base;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1409 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1410 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1411 if ((c1 != UTF_8_BOM_1)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1412 || (c2 != UTF_8_BOM_2) || (c3 != UTF_8_BOM_3))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1413 src = src_base;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1414 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1415 CODING_UTF_8_BOM (coding) = utf_without_bom;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1416 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1417 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1418 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1419 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1420 CODING_UTF_8_BOM (coding) = utf_without_bom;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1421
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1422 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1423 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1424 int c, c1, c2, c3, c4, c5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1425
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1426 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1427 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1428
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1429 if (charbuf >= charbuf_end)
100936
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
1430 {
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
1431 if (byte_after_cr >= 0)
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
1432 src_base--;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
1433 break;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
1434 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1435
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1436 if (byte_after_cr >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1437 c1 = byte_after_cr, byte_after_cr = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1438 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1439 ONE_MORE_BYTE (c1);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1440 if (c1 < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1441 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1442 c = - c1;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1443 }
109158
6175ebc3b6ce * coding.c: Use SPECPDL_INDEX, DOS_NT.
Juanma Barranquero <lekktu@gmail.com>
parents: 109126
diff changeset
1444 else if (UTF_8_1_OCTET_P (c1))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1445 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1446 if (eol_crlf && c1 == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1447 ONE_MORE_BYTE (byte_after_cr);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1448 c = c1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1449 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1450 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1451 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1452 ONE_MORE_BYTE (c2);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1453 if (c2 < 0 || ! UTF_8_EXTRA_OCTET_P (c2))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1454 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1455 if (UTF_8_2_OCTET_LEADING_P (c1))
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1456 {
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1457 c = ((c1 & 0x1F) << 6) | (c2 & 0x3F);
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1458 /* Reject overlong sequences here and below. Encoders
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1459 producing them are incorrect, they can be misleading,
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1460 and they mess up read/write invariance. */
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1461 if (c < 128)
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1462 goto invalid_code;
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1463 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1464 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1465 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1466 ONE_MORE_BYTE (c3);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1467 if (c3 < 0 || ! UTF_8_EXTRA_OCTET_P (c3))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1468 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1469 if (UTF_8_3_OCTET_LEADING_P (c1))
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1470 {
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1471 c = (((c1 & 0xF) << 12)
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1472 | ((c2 & 0x3F) << 6) | (c3 & 0x3F));
89184
88a9e962e183 (decode_coding_utf_8): Treat surrogates as invalid.
Dave Love <fx@gnu.org>
parents: 89042
diff changeset
1473 if (c < 0x800
88a9e962e183 (decode_coding_utf_8): Treat surrogates as invalid.
Dave Love <fx@gnu.org>
parents: 89042
diff changeset
1474 || (c >= 0xd800 && c < 0xe000)) /* surrogates (invalid) */
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1475 goto invalid_code;
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1476 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1477 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1478 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1479 ONE_MORE_BYTE (c4);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1480 if (c4 < 0 || ! UTF_8_EXTRA_OCTET_P (c4))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1481 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1482 if (UTF_8_4_OCTET_LEADING_P (c1))
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1483 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1484 c = (((c1 & 0x7) << 18) | ((c2 & 0x3F) << 12)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1485 | ((c3 & 0x3F) << 6) | (c4 & 0x3F));
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1486 if (c < 0x10000)
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1487 goto invalid_code;
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1488 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1489 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1490 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1491 ONE_MORE_BYTE (c5);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1492 if (c5 < 0 || ! UTF_8_EXTRA_OCTET_P (c5))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1493 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1494 if (UTF_8_5_OCTET_LEADING_P (c1))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1495 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1496 c = (((c1 & 0x3) << 24) | ((c2 & 0x3F) << 18)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1497 | ((c3 & 0x3F) << 12) | ((c4 & 0x3F) << 6)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1498 | (c5 & 0x3F));
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1499 if ((c > MAX_CHAR) || (c < 0x200000))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1500 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1501 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1502 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1503 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1504 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1505 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1506 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1507 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1508
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1509 *charbuf++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1510 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1511
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1512 invalid_code:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1513 src = src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1514 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1515 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1516 *charbuf++ = ASCII_BYTE_P (c) ? c : BYTE8_TO_CHAR (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1517 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1518 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1519
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1520 no_more_source:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1521 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1522 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1523 coding->charbuf_used = charbuf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1524 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1525
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1526
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1527 static int
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
1528 encode_coding_utf_8 (struct coding_system *coding)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1529 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1530 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1531 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1532 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1533 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1534 unsigned char *dst_end = coding->destination + coding->dst_bytes;
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
1535 int produced_chars = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1536 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1537
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1538 if (CODING_UTF_8_BOM (coding) == utf_with_bom)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1539 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1540 ASSURE_DESTINATION (3);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1541 EMIT_THREE_BYTES (UTF_8_BOM_1, UTF_8_BOM_2, UTF_8_BOM_3);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1542 CODING_UTF_8_BOM (coding) = utf_without_bom;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1543 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1544
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1545 if (multibytep)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1546 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1547 int safe_room = MAX_MULTIBYTE_LENGTH * 2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1548
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1549 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1550 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1551 unsigned char str[MAX_MULTIBYTE_LENGTH], *p, *pend = str;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1552
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1553 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1554 c = *charbuf++;
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1555 if (CHAR_BYTE8_P (c))
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1556 {
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1557 c = CHAR_TO_BYTE8 (c);
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1558 EMIT_ONE_BYTE (c);
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1559 }
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1560 else
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1561 {
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1562 CHAR_STRING_ADVANCE_NO_UNIFY (c, pend);
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1563 for (p = str; p < pend; p++)
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1564 EMIT_ONE_BYTE (*p);
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1565 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1566 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1567 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1568 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1569 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1570 int safe_room = MAX_MULTIBYTE_LENGTH;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1571
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1572 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1573 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1574 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1575 c = *charbuf++;
89917
1763eef5ad02 (encode_coding_utf_8): Fix handling of raw-byte char.
Kenichi Handa <handa@m17n.org>
parents: 89905
diff changeset
1576 if (CHAR_BYTE8_P (c))
1763eef5ad02 (encode_coding_utf_8): Fix handling of raw-byte char.
Kenichi Handa <handa@m17n.org>
parents: 89905
diff changeset
1577 *dst++ = CHAR_TO_BYTE8 (c);
1763eef5ad02 (encode_coding_utf_8): Fix handling of raw-byte char.
Kenichi Handa <handa@m17n.org>
parents: 89905
diff changeset
1578 else
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1579 CHAR_STRING_ADVANCE_NO_UNIFY (c, dst);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1580 produced_chars++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1581 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1582 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1583 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1584 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1585 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1586 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1587 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1588
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1589
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1590 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1591 Check if a text is encoded in one of UTF-16 based coding systems.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1592 If it is, return 1, else return 0. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1593
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Nonzero if bits 10..15 of VAL are 110110, i.e. VAL, taken as a
   16-bit code unit, is a high surrogate (0xD800..0xDBFF).  Bits
   outside the 0xFC00 mask are ignored.  */
#define UTF_16_HIGH_SURROGATE_P(val)            \
  ((((val) ^ 0xD800) & 0xFC00) == 0)

/* Nonzero if bits 10..15 of VAL are 110111, i.e. VAL, taken as a
   16-bit code unit, is a low surrogate (0xDC00..0xDFFF).  Bits
   outside the 0xFC00 mask are ignored.  */
#define UTF_16_LOW_SURROGATE_P(val)             \
  ((((val) ^ 0xDC00) & 0xFC00) == 0)

/* Nonzero if VAL is 0xFFFE, 0xFFFF, or a low surrogate.  VAL may be
   evaluated more than once, so it must have no side effects.  */
#define UTF_16_INVALID_P(val)                   \
  ((val) == 0xFFFE                              \
   || (val) == 0xFFFF                           \
   || UTF_16_LOW_SURROGATE_P (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1604
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1605
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Inspect the source text of CODING for signs of UTF-16 and record the
   outcome in DETECT_INFO.

   CATEGORY_MASK_UTF_16 is always added to DETECT_INFO->checked.

   Outcomes, in the order they are tested:
   - CODING is flagged as the last block and CODING->src_chars is odd:
     CATEGORY_MASK_UTF_16 is rejected; return 0.
   - The first two bytes are FF FE: the LE and AUTO categories are
     marked found and BE, BE_NOSIG, LE_NOSIG rejected; return 1.
   - The first two bytes are FE FF: the BE and AUTO categories are
     marked found and LE, BE_NOSIG, LE_NOSIG rejected; return 1.
   - The second fetched value is negative: CATEGORY_MASK_UTF_16 is
     rejected; return 0.
   - Otherwise: AUTO, BE and LE are rejected, the rest of the text is
     scanned to decide whether BE_NOSIG and/or LE_NOSIG must be
     rejected as well, and 0 is returned.

   The label `no_more_source' (return 1) is not referenced explicitly
   here; presumably TWO_MORE_BYTES jumps to it when the source runs
   out, and also relies on the locals `src', `src_end' and
   `multibytep' -- the macro is defined elsewhere, TODO confirm.  */

static int
detect_coding_utf_16 (struct coding_system *coding,
                      struct coding_detection_info *detect_info)
{
  const unsigned char *src = coding->source;
  const unsigned char *src_end = coding->source + coding->src_bytes;
  int multibytep = coding->src_multibyte;
  int c1, c2;

  detect_info->checked |= CATEGORY_MASK_UTF_16;
  /* A final block with an odd src_chars count is rejected outright.  */
  if (coding->mode & CODING_MODE_LAST_BLOCK
      && (coding->src_chars & 1))
    {
      detect_info->rejected |= CATEGORY_MASK_UTF_16;
      return 0;
    }

  TWO_MORE_BYTES (c1, c2);
  if ((c1 == 0xFF) && (c2 == 0xFE))
    {
      /* Bytes FF FE: little-endian signature.  */
      detect_info->found |= (CATEGORY_MASK_UTF_16_LE
                             | CATEGORY_MASK_UTF_16_AUTO);
      detect_info->rejected |= (CATEGORY_MASK_UTF_16_BE
                                | CATEGORY_MASK_UTF_16_BE_NOSIG
                                | CATEGORY_MASK_UTF_16_LE_NOSIG);
    }
  else if ((c1 == 0xFE) && (c2 == 0xFF))
    {
      /* Bytes FE FF: big-endian signature.  */
      detect_info->found |= (CATEGORY_MASK_UTF_16_BE
                             | CATEGORY_MASK_UTF_16_AUTO);
      detect_info->rejected |= (CATEGORY_MASK_UTF_16_LE
                                | CATEGORY_MASK_UTF_16_BE_NOSIG
                                | CATEGORY_MASK_UTF_16_LE_NOSIG);
    }
  else if (c2 < 0)
    {
      /* TWO_MORE_BYTES delivered a negative second value; treat the
         text as not UTF-16 at all.  */
      detect_info->rejected |= CATEGORY_MASK_UTF_16;
      return 0;
    }
  else
    {
      /* We check the dispersion of Eth and Oth bytes where E is even and
         O is odd.  If both are high, we assume binary data.

         e[] and o[] flag which byte values have been seen as the first
         and second member of a pair respectively; e_num and o_num count
         the distinct values.  Both counts start at 1 because the pair
         fetched above is recorded before the loop.  */
      unsigned char e[256], o[256];
      unsigned e_num = 1, o_num = 1;

      memset (e, 0, 256);
      memset (o, 0, 256);
      e[c1] = 1;
      o[c2] = 1;

      /* No signature was found, so only the *_NOSIG categories can
         still apply.  */
      detect_info->rejected |= (CATEGORY_MASK_UTF_16_AUTO
                                |CATEGORY_MASK_UTF_16_BE
                                | CATEGORY_MASK_UTF_16_LE);

      /* Keep scanning until every bit of CATEGORY_MASK_UTF_16 has been
         rejected, or the fetch below leaves the loop.  */
      while ((detect_info->rejected & CATEGORY_MASK_UTF_16)
             != CATEGORY_MASK_UTF_16)
        {
          TWO_MORE_BYTES (c1, c2);
          if (c2 < 0)
            break;
          if (! e[c1])
            {
              e[c1] = 1;
              e_num++;
              /* 128 distinct first-of-pair bytes: reject big-endian
                 without signature.  */
              if (e_num >= 128)
                detect_info->rejected |= CATEGORY_MASK_UTF_16_BE_NOSIG;
            }
          if (! o[c2])
            {
              o[c2] = 1;
              o_num++;
              /* 128 distinct second-of-pair bytes: reject little-endian
                 without signature.  */
              if (o_num >= 128)
                detect_info->rejected |= CATEGORY_MASK_UTF_16_LE_NOSIG;
            }
        }
      return 0;
    }

 no_more_source:
  return 1;
}
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1688
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Decode UTF-16 source text of CODING into CODING->charbuf.

   Decoding resumes at CODING->source + CODING->consumed and appends to
   CODING->charbuf starting at index CODING->charbuf_used.  On exit,
   CODING->consumed_char, CODING->consumed and CODING->charbuf_used are
   updated; CODING->errors is incremented for a missing BOM and for an
   unpaired high surrogate.  The BOM setting and the pending-surrogate
   state of CODING are updated through CODING_UTF_16_BOM and
   CODING_UTF_16_SURROGATE, so a surrogate pair may straddle two calls.

   ONE_MORE_BYTE is defined elsewhere; presumably it uses the locals
   `src', `src_end', `src_base', `multibytep' and `consumed_chars', and
   jumps to `no_more_source' when the source is exhausted -- TODO
   confirm against the macro definition.  */

static void
decode_coding_utf_16 (struct coding_system *coding)
{
  const unsigned char *src = coding->source + coding->consumed;
  const unsigned char *src_end = coding->source + coding->src_bytes;
  /* Start of the code unit currently being decoded; everything before
     it is reported as consumed on exit.  */
  const unsigned char *src_base;
  int *charbuf = coding->charbuf + coding->charbuf_used;
  /* We may produce at most 3 chars in one loop.  */
  int *charbuf_end = coding->charbuf + coding->charbuf_size - 2;
  int consumed_chars = 0, consumed_chars_base = 0;
  int multibytep = coding->src_multibyte;
  enum utf_bom_type bom = CODING_UTF_16_BOM (coding);
  enum utf_16_endian_type endian = CODING_UTF_16_ENDIAN (coding);
  /* Nonzero holds a high surrogate still waiting for its low half.  */
  int surrogate = CODING_UTF_16_SURROGATE (coding);
  Lisp_Object attr, charset_list;
  int eol_crlf =
    !inhibit_eol_conversion && EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
  /* The two bytes prefetched after a CR, or -1 when nothing is
     pending.  */
  int byte_after_cr1 = -1, byte_after_cr2 = -1;

  CODING_GET_INFO (coding, attr, charset_list);

  if (bom == utf_with_bom)
    {
      int c, c1, c2;

      src_base = src;
      ONE_MORE_BYTE (c1);
      ONE_MORE_BYTE (c2);
      /* The pair is always combined first-byte-high here, so a
         little-endian BOM (bytes FF FE) reads as 0xFFFE.  */
      c = (c1 << 8) | c2;

      if (endian == utf_16_big_endian
          ? c != 0xFEFF : c != 0xFFFE)
        {
          /* The first two bytes are not BOM.  Treat them as bytes
             for a normal character.  */
          src = src_base;
          coding->errors++;
        }
      /* Either way, do not look for a BOM again.  */
      CODING_UTF_16_BOM (coding) = utf_without_bom;
    }
  else if (bom == utf_detect_bom)
    {
      /* We have already tried to detect BOM and failed in
         detect_coding.  */
      CODING_UTF_16_BOM (coding) = utf_without_bom;
    }

  while (1)
    {
      int c, c1, c2;

      src_base = src;
      consumed_chars_base = consumed_chars;

      if (charbuf >= charbuf_end)
        {
          /* Out of output room.  If two bytes were prefetched after a
             CR, step src_base back over them so they are not reported
             as consumed.
             NOTE(review): consumed_chars_base is not adjusted here --
             confirm whether ONE_MORE_BYTE counted the prefetched
             bytes.  */
          if (byte_after_cr1 >= 0)
            src_base -= 2;
          break;
        }

      /* Take the first byte from the prefetch if there is one.  */
      if (byte_after_cr1 >= 0)
        c1 = byte_after_cr1, byte_after_cr1 = -1;
      else
        ONE_MORE_BYTE (c1);
      if (c1 < 0)
        {
          /* Negative value from ONE_MORE_BYTE: store its negation
             directly (presumably an already-decoded multibyte
             character -- TODO confirm).  */
          *charbuf++ = -c1;
          continue;
        }
      if (byte_after_cr2 >= 0)
        c2 = byte_after_cr2, byte_after_cr2 = -1;
      else
        ONE_MORE_BYTE (c2);
      if (c2 < 0)
        {
          /* The second fetch was negative: emit the first byte on its
             own (as itself if ASCII, else via BYTE8_TO_CHAR), then the
             negated second value.  */
          *charbuf++ = ASCII_BYTE_P (c1) ? c1 : BYTE8_TO_CHAR (c1);
          *charbuf++ = -c2;
          continue;
        }
      /* Assemble the 16-bit code unit according to byte order.  */
      c = (endian == utf_16_big_endian
           ? ((c1 << 8) | c2) : ((c2 << 8) | c1));

      if (surrogate)
        {
          if (! UTF_16_LOW_SURROGATE_P (c))
            {
              /* A pending high surrogate is not followed by a low one.
                 Emit the pending surrogate's two bytes separately, in
                 source byte order, and count an error.  */
              if (endian == utf_16_big_endian)
                c1 = surrogate >> 8, c2 = surrogate & 0xFF;
              else
                c1 = surrogate & 0xFF, c2 = surrogate >> 8;
              *charbuf++ = c1;
              *charbuf++ = c2;
              coding->errors++;
              /* The current unit either becomes the new pending high
                 surrogate or is emitted as is (third char of this
                 iteration).  */
              if (UTF_16_HIGH_SURROGATE_P (c))
                CODING_UTF_16_SURROGATE (coding) = surrogate = c;
              else
                *charbuf++ = c;
            }
          else
            {
              /* Valid pair: ten bits from each half, offset by
                 0x10000.  */
              c = ((surrogate - 0xD800) << 10) | (c - 0xDC00);
              CODING_UTF_16_SURROGATE (coding) = surrogate = 0;
              *charbuf++ = 0x10000 + c;
            }
        }
      else
        {
          if (UTF_16_HIGH_SURROGATE_P (c))
            /* Remember it and wait for the low half.  */
            CODING_UTF_16_SURROGATE (coding) = surrogate = c;
          else
            {
              if (eol_crlf && c == '\r')
                {
                  /* Prefetch the two bytes after the CR before
                     emitting it.  If the source ends here, src_base
                     still points at the CR, so the CR is left
                     unconsumed (assuming ONE_MORE_BYTE jumps to
                     no_more_source -- TODO confirm).  */
                  ONE_MORE_BYTE (byte_after_cr1);
                  ONE_MORE_BYTE (byte_after_cr2);
                }
              *charbuf++ = c;
            }
        }
    }

 no_more_source:
  /* Report progress only up to the start of the last code unit that
     was not completely processed.  */
  coding->consumed_char += consumed_chars_base;
  coding->consumed = src_base - coding->source;
  coding->charbuf_used = charbuf - coding->charbuf;
}
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1816
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1817 static int
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
1818 encode_coding_utf_16 (struct coding_system *coding)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1819 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1820 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1821 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1822 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1823 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1824 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1825 int safe_room = 8;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1826 enum utf_bom_type bom = CODING_UTF_16_BOM (coding);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1827 int big_endian = CODING_UTF_16_ENDIAN (coding) == utf_16_big_endian;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1828 int produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1829 Lisp_Object attrs, charset_list;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1830 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1831
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1832 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1833
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1834 if (bom != utf_without_bom)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1835 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1836 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1837 if (big_endian)
89404
3e1d187b52c3 (Qutf_16_be_nosig, Qutf_16_be, Qutf_16_le_nosig)
Kenichi Handa <handa@m17n.org>
parents: 89394
diff changeset
1838 EMIT_TWO_BYTES (0xFE, 0xFF);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1839 else
89404
3e1d187b52c3 (Qutf_16_be_nosig, Qutf_16_be, Qutf_16_le_nosig)
Kenichi Handa <handa@m17n.org>
parents: 89394
diff changeset
1840 EMIT_TWO_BYTES (0xFF, 0xFE);
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1841 CODING_UTF_16_BOM (coding) = utf_without_bom;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1842 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1843
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1844 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1845 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1846 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1847 c = *charbuf++;
104636
bc74846b9a54 (encode_coding_utf_16): Fix checking of an Unicode character.
Kenichi Handa <handa@m17n.org>
parents: 103762
diff changeset
1848 if (c > MAX_UNICODE_CHAR)
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
1849 c = coding->default_char;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1850
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1851 if (c < 0x10000)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1852 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1853 if (big_endian)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1854 EMIT_TWO_BYTES (c >> 8, c & 0xFF);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1855 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1856 EMIT_TWO_BYTES (c & 0xFF, c >> 8);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1857 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1858 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1859 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1860 int c1, c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1861
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1862 c -= 0x10000;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1863 c1 = (c >> 10) + 0xD800;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1864 c2 = (c & 0x3FF) + 0xDC00;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1865 if (big_endian)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1866 EMIT_FOUR_BYTES (c1 >> 8, c1 & 0xFF, c2 >> 8, c2 & 0xFF);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1867 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1868 EMIT_FOUR_BYTES (c1 & 0xFF, c1 >> 8, c2 & 0xFF, c2 >> 8);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1869 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1870 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1871 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1872 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1873 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1874 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1875 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1876
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1877
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1878 /*** 6. Old Emacs' internal format (emacs-mule) ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1879
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1880 /* Emacs' internal format for representation of multiple character
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1881 sets is a kind of multi-byte encoding, i.e. characters are
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1882 represented by variable-length sequences of one-byte codes.
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1883
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1884 ASCII characters and control characters (e.g. `tab', `newline') are
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1885 represented by one-byte sequences which are their ASCII codes, in
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1886 the range 0x00 through 0x7F.
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1887
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1888 8-bit characters of the range 0x80..0x9F are represented by
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1889 two-byte sequences of LEADING_CODE_8_BIT_CONTROL and (their 8-bit
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1890 code + 0x20).
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1891
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1892 8-bit characters of the range 0xA0..0xFF are represented by
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1893 one-byte sequences which are their 8-bit code.
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1894
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1895 The other characters are represented by a sequence of `base
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1896 leading-code', optional `extended leading-code', and one or two
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1897 `position-code's. The length of the sequence is determined by the
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1898 base leading-code. Leading-code takes the range 0x81 through 0x9D,
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1899 whereas extended leading-code and position-code take the range 0xA0
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1900 through 0xFF. See `charset.h' for more details about leading-code
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1901 and position-code.
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
1902
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1903 --- CODE RANGE of Emacs' internal format ---
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1904 character set range
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1905 ------------- -----
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1906 ascii 0x00..0x7F
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1907 eight-bit-control LEADING_CODE_8_BIT_CONTROL + 0xA0..0xBF
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1908 eight-bit-graphic 0xA0..0xFF
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1909 ELSE 0x81..0x9D + [0xA0..0xFF]+
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1910 ---------------------------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1911
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1912 As this is the internal character representation, the format is
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1913 usually not used externally (i.e. in a file or in data sent to a
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1914 process). But, it is possible to have a text externally in this
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1915 format (i.e. by encoding by the coding system `emacs-mule').
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1916
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1917 In that case, a sequence of one-byte codes has a slightly different
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1918 form.
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1919
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1920 At first, all characters in eight-bit-control are represented by
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1921 one-byte sequences which are their 8-bit code.
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1922
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1923 Next, character composition data are represented by the byte
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1924 sequence of the form: 0x80 METHOD BYTES CHARS COMPONENT ...,
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1925 where,
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1926 METHOD is 0xF2 plus one of the composition methods (enum
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1927 composition_method),
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1928
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1929 BYTES is 0xA0 plus the byte length of this composition data,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1930
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1931 CHARS is 0xA0 plus the number of characters composed by this
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1932 data,
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1933
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
1934 COMPONENTs are characters of multibyte form or composition
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1935 rules encoded as two bytes of ASCII codes.
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1936
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1937 In addition, for backward compatibility, the following formats are
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1938 also recognized as composition data on decoding.
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1939
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1940 0x80 MSEQ ...
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1941 0x80 0xFF MSEQ RULE MSEQ RULE ... MSEQ
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1942
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1943 Here,
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1944 MSEQ is a multibyte form but in one of these special formats:
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1945 ASCII: 0xA0 ASCII_CODE+0x80,
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1946 other: LEADING_CODE+0x20 FOLLOWING-BYTE ...,
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1947 RULE is a one byte code of the range 0xA0..0xF0 that
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1948 represents a composition rule.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1949 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1950
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1951 char emacs_mule_bytes[256];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1952
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1953
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1954 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1955 Check if a text is encoded in `emacs-mule'. If it is, return 1,
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1956 else return 0. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1957
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1958 static int
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
1959 detect_coding_emacs_mule (struct coding_system *coding,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
1960 struct coding_detection_info *detect_info)
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1961 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1962 const unsigned char *src = coding->source, *src_base;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1963 const unsigned char *src_end = coding->source + coding->src_bytes;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1964 int multibytep = coding->src_multibyte;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1965 int consumed_chars = 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1966 int c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1967 int found = 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1968
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1969 detect_info->checked |= CATEGORY_MASK_EMACS_MULE;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1970 /* A coding system of this category is always ASCII compatible. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1971 src += coding->head_ascii;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1972
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1973 while (1)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1974 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1975 src_base = src;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1976 ONE_MORE_BYTE (c);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1977 if (c < 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1978 continue;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1979 if (c == 0x80)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1980 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1981 /* Perhaps the start of composite character. We simply skip
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1982 it because analyzing it is too heavy for detecting. But,
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1983 at least, we check that the composite character
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1984 consists of more than 4 bytes. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1985 const unsigned char *src_base;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1986
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1987 repeat:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1988 src_base = src;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1989 do
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1990 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1991 ONE_MORE_BYTE (c);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1992 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1993 while (c >= 0xA0);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1994
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1995 if (src - src_base <= 4)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1996 break;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1997 found = CATEGORY_MASK_EMACS_MULE;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1998 if (c == 0x80)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1999 goto repeat;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2000 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2001
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2002 if (c < 0x80)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2003 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2004 if (c < 0x20
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2005 && (c == ISO_CODE_ESC || c == ISO_CODE_SI || c == ISO_CODE_SO))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2006 break;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2007 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2008 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2009 {
110334
4ad4f097835e coding.c (detect_coding_emacs_mule): Fix checking of multibyte sequence when the source is multibyte.
Kenichi Handa <handa@m17n.org>
parents: 109710
diff changeset
2010 int more_bytes = emacs_mule_bytes[c] - 1;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2011
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2012 while (more_bytes > 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2013 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2014 ONE_MORE_BYTE (c);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2015 if (c < 0xA0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2016 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2017 src--; /* Unread the last byte. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2018 break;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2019 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2020 more_bytes--;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2021 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2022 if (more_bytes != 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2023 break;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2024 found = CATEGORY_MASK_EMACS_MULE;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2025 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2026 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2027 detect_info->rejected |= CATEGORY_MASK_EMACS_MULE;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2028 return 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2029
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2030 no_more_source:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2031 if (src_base < src && coding->mode & CODING_MODE_LAST_BLOCK)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2032 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2033 detect_info->rejected |= CATEGORY_MASK_EMACS_MULE;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2034 return 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2035 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2036 detect_info->found |= found;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2037 return 1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2038 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2039
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2040
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2041 /* Parse emacs-mule multibyte sequence at SRC and return the decoded
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2042 character. If CMP_STATUS indicates that we must expect MSEQ or
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2043 RULE described above, decode it and return the negative value of
107323
ebc10ed88b5c (emacs_mule_char): Fix a typo in commentary.
Eli Zaretskii <eliz@gnu.org>
parents: 107321
diff changeset
2044 the decoded character or rule. If an invalid byte is found, return
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2045 -1. If SRC is too short, return -2. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2046
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2047 int
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
2048 emacs_mule_char (struct coding_system *coding, const unsigned char *src,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
2049 int *nbytes, int *nchars, int *id,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
2050 struct composition_status *cmp_status)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2051 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2052 const unsigned char *src_end = coding->source + coding->src_bytes;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2053 const unsigned char *src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2054 int multibytep = coding->src_multibyte;
111743
913b779aa4ee Fix decoding of emacs-mule coding system.
Kenichi Handa <handa@m17n.org>
parents: 110983
diff changeset
2055 int charset_id;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2056 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2057 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2058 int consumed_chars = 0;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2059 int mseq_found = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2060
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2061 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2062 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2063 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2064 c = -c;
111743
913b779aa4ee Fix decoding of emacs-mule coding system.
Kenichi Handa <handa@m17n.org>
parents: 110983
diff changeset
2065 charset_id = emacs_mule_charset[0];
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2066 }
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2067 else
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2068 {
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2069 if (c >= 0xA0)
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2070 {
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2071 if (cmp_status->state != COMPOSING_NO
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2072 && cmp_status->old_form)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2073 {
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2074 if (cmp_status->state == COMPOSING_CHAR)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2075 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2076 if (c == 0xA0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2077 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2078 ONE_MORE_BYTE (c);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2079 c -= 0x80;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2080 if (c < 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2081 goto invalid_code;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2082 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2083 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2084 c -= 0x20;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2085 mseq_found = 1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2086 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2087 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2088 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2089 *nbytes = src - src_base;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2090 *nchars = consumed_chars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2091 return -c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2092 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2093 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2094 else
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2095 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2096 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2097
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2098 switch (emacs_mule_bytes[c])
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2099 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2100 case 2:
111743
913b779aa4ee Fix decoding of emacs-mule coding system.
Kenichi Handa <handa@m17n.org>
parents: 110983
diff changeset
2101 if ((charset_id = emacs_mule_charset[c]) < 0)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2102 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2103 ONE_MORE_BYTE (c);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2104 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2105 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2106 code = c & 0x7F;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2107 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2108
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2109 case 3:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2110 if (c == EMACS_MULE_LEADING_CODE_PRIVATE_11
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2111 || c == EMACS_MULE_LEADING_CODE_PRIVATE_12)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2112 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2113 ONE_MORE_BYTE (c);
111743
913b779aa4ee Fix decoding of emacs-mule coding system.
Kenichi Handa <handa@m17n.org>
parents: 110983
diff changeset
2114 if (c < 0xA0 || (charset_id = emacs_mule_charset[c]) < 0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2115 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2116 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
2117 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2118 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2119 code = c & 0x7F;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2120 }
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2121 else
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2122 {
111743
913b779aa4ee Fix decoding of emacs-mule coding system.
Kenichi Handa <handa@m17n.org>
parents: 110983
diff changeset
2123 if ((charset_id = emacs_mule_charset[c]) < 0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2124 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2125 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
2126 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2127 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2128 code = (c & 0x7F) << 8;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2129 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
2130 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2131 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2132 code |= c & 0x7F;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2133 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2134 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2135
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2136 case 4:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2137 ONE_MORE_BYTE (c);
111743
913b779aa4ee Fix decoding of emacs-mule coding system.
Kenichi Handa <handa@m17n.org>
parents: 110983
diff changeset
2138 if (c < 0 || (charset_id = emacs_mule_charset[c]) < 0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2139 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2140 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
2141 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2142 goto invalid_code;
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2143 code = (c & 0x7F) << 8;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2144 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
2145 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2146 goto invalid_code;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2147 code |= c & 0x7F;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2148 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2149
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2150 case 1:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2151 code = c;
111743
913b779aa4ee Fix decoding of emacs-mule coding system.
Kenichi Handa <handa@m17n.org>
parents: 110983
diff changeset
2152 charset_id = ASCII_BYTE_P (code) ? charset_ascii : charset_eight_bit;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2153 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2154
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2155 default:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2156 abort ();
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2157 }
111743
913b779aa4ee Fix decoding of emacs-mule coding system.
Kenichi Handa <handa@m17n.org>
parents: 110983
diff changeset
2158 CODING_DECODE_CHAR (coding, src, src_base, src_end,
913b779aa4ee Fix decoding of emacs-mule coding system.
Kenichi Handa <handa@m17n.org>
parents: 110983
diff changeset
2159 CHARSET_FROM_ID (charset_id), code, c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2160 if (c < 0)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2161 goto invalid_code;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2162 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2163 *nbytes = src - src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2164 *nchars = consumed_chars;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2165 if (id)
111743
913b779aa4ee Fix decoding of emacs-mule coding system.
Kenichi Handa <handa@m17n.org>
parents: 110983
diff changeset
2166 *id = charset_id;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2167 return (mseq_found ? -c : c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2168
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2169 no_more_source:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2170 return -2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2171
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2172 invalid_code:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2173 return -1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2174 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2175
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2176
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2177 /* See the above "GENERAL NOTES on `decode_coding_XXX ()' functions". */
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2178
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2179 /* Handle these composition sequences ('|': the end of header elements,
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2180 BYTES and CHARS >= 0xA0):
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2181
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2182 (1) relative composition: 0x80 0xF2 BYTES CHARS | CHAR ...
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2183 (2) altchar composition: 0x80 0xF4 BYTES CHARS | ALT ... ALT CHAR ...
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2184 (3) alt&rule composition: 0x80 0xF5 BYTES CHARS | ALT RULE ... ALT CHAR ...
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2185
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2186 and these old forms:
109158
6175ebc3b6ce * coding.c: Use SPECPDL_INDEX, DOS_NT.
Juanma Barranquero <lekktu@gmail.com>
parents: 109126
diff changeset
2187
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2188 (4) relative composition: 0x80 | MSEQ ... MSEQ
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2189 (5) rulebase composition: 0x80 0xFF | MSEQ MRULE ... MSEQ
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2190
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2191 When the starter 0x80 and the following header elements are found,
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2192 this annotation header is produced.
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2193
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2194 [ -LENGTH(==-5) CODING_ANNOTATE_COMPOSITION_MASK NCHARS NBYTES METHOD ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2195
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2196 NCHARS is CHARS - 0xA0 for (1), (2), (3), and 0 for (4), (5).
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2197 NBYTES is BYTES - 0xA0 for (1), (2), (3), and 0 for (4), (5).
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2198
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2199 Then, upon reading the following elements, these codes are produced
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2200 until the composition end is found:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2201
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2202 (1) CHAR ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2203 (2) ALT ... ALT CHAR ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2204 (3) ALT -2 DECODED-RULE ALT -2 DECODED-RULE ... ALT CHAR ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2205 (4) CHAR ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2206 (5) CHAR -2 DECODED-RULE CHAR -2 DECODED-RULE ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2207
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2208 When the composition end is found, LENGTH and NCHARS in the
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2209 annotation header are updated as below:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2210
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2211 (1) LENGTH: unchanged, NCHARS: unchanged
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2212 (2) LENGTH: length of the whole sequence minus NCHARS, NCHARS: unchanged
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2213 (3) LENGTH: length of the whole sequence minus NCHARS, NCHARS: unchanged
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2214 (4) LENGTH: unchanged, NCHARS: number of CHARs
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2215 (5) LENGTH: unchanged, NCHARS: number of CHARs
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2216
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2217 If an error is found while composing, the annotation header is
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2218 changed to the original composition header (plus filler -1s) as
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2219 below:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2220
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2221 (1),(2),(3) [ 0x80 0xF2+METHOD BYTES CHARS -1 ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2222 (5) [ 0x80 0xFF -1 -1 -1 ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2223
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2224 and the sequence [ -2 DECODED-RULE ] is changed to the original
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2225 byte sequence as below:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2226 o the original byte sequence is B: [ B -1 ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2227 o the original byte sequence is B1 B2: [ B1 B2 ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2228
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2229 Most of the routines are implemented by macros because many
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2230 variables and labels in the caller decode_coding_emacs_mule must be
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2231 accessible, and they are usually called just once (thus they don't
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2232 increase the size of compiled object). */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2233
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2234 /* Decode a composition rule represented by C as a component of
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2235 composition sequence of Emacs 20 style. Set RULE to the decoded
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2236 rule. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2237
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2238 #define DECODE_EMACS_MULE_COMPOSITION_RULE_20(c, rule) \
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2239 do { \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2240 int gref, nref; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2241 \
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2242 c -= 0xA0; \
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2243 if (c < 0 || c >= 81) \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2244 goto invalid_code; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2245 gref = c / 9, nref = c % 9; \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2246 if (gref == 4) gref = 10; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2247 if (nref == 4) nref = 10; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2248 rule = COMPOSITION_ENCODE_RULE (gref, nref); \
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2249 } while (0)
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2250
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2251
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2252 /* Decode a composition rule represented by C and the following byte
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2253 at SRC as a component of composition sequence of Emacs 21 style.
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2254 Set RULE to the decoded rule. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2255
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2256 #define DECODE_EMACS_MULE_COMPOSITION_RULE_21(c, rule) \
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2257 do { \
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2258 int gref, nref; \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2259 \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2260 gref = c - 0x20; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2261 if (gref < 0 || gref >= 81) \
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2262 goto invalid_code; \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2263 ONE_MORE_BYTE (c); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2264 nref = c - 0x20; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2265 if (nref < 0 || nref >= 81) \
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2266 goto invalid_code; \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2267 rule = COMPOSITION_ENCODE_RULE (gref, nref); \
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2268 } while (0)
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2269
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2270
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
/* Parse the header of an Emacs 21 style composition.  On entry C
   holds the first header byte, which is 0xF2 + METHOD.  The next two
   bytes read from SRC are 0xA0 + BYTES and 0xA0 + CHARS, where BYTES
   is the byte length of this composition information and CHARS is
   the number of characters composed by this composition.

   Jump to invalid_code when BYTES is less than 3, when METHOD is
   COMPOSITION_RELATIVE and BYTES is not 4, or when CHARS is not in
   the range 1 .. MAX_COMPOSITION_COMPONENTS - 1.  Otherwise record
   the composition in CMP_STATUS and emit its annotation through
   ADD_COMPOSITION_DATA.  */

#define DECODE_EMACS_MULE_21_COMPOSITION()                              \
  do {                                                                  \
    enum composition_method mule_method = c - 0xF2;                     \
    int info_bytes, info_chars;                                         \
                                                                        \
    ONE_MORE_BYTE (c);                                                  \
    if (c < 0)                                                          \
      goto invalid_code;                                                \
    info_bytes = c - 0xA0;                                              \
    if (info_bytes < 3)                                                 \
      goto invalid_code;                                                \
    if (mule_method == COMPOSITION_RELATIVE && info_bytes != 4)         \
      goto invalid_code;                                                \
    ONE_MORE_BYTE (c);                                                  \
    /* A negative C yields a non-positive count, rejected below.  */    \
    info_chars = c - 0xA0;                                              \
    if (info_chars <= 0 || info_chars >= MAX_COMPOSITION_COMPONENTS)    \
      goto invalid_code;                                                \
    cmp_status->old_form = 0;                                           \
    cmp_status->method = mule_method;                                   \
    cmp_status->state = (mule_method == COMPOSITION_RELATIVE            \
                         ? COMPOSING_CHAR                               \
                         : COMPOSING_COMPONENT_CHAR);                   \
    cmp_status->length = MAX_ANNOTATION_LENGTH;                         \
    cmp_status->nchars = info_chars;                                    \
    cmp_status->ncomps = info_bytes - 4;                                \
    ADD_COMPOSITION_DATA (charbuf, info_chars, info_bytes,              \
                          mule_method);                                 \
  } while (0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2302
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2303
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
/* Start of Emacs 20 style format for relative composition.  Mark
   CMP_STATUS as an old-form COMPOSITION_RELATIVE composition in the
   COMPOSING_CHAR state with zero characters and components so far,
   and emit a composition annotation whose counts are both zero.  */

#define DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION()             \
  do {                                                          \
    cmp_status->method = COMPOSITION_RELATIVE;                  \
    cmp_status->old_form = 1;                                   \
    cmp_status->state = COMPOSING_CHAR;                         \
    cmp_status->ncomps = 0;                                     \
    cmp_status->nchars = 0;                                     \
    cmp_status->length = MAX_ANNOTATION_LENGTH;                 \
    ADD_COMPOSITION_DATA (charbuf, 0, 0, cmp_status->method);   \
  } while (0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2315
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2316
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
/* Start of Emacs 20 style format for rule-base composition.  Mark
   CMP_STATUS as an old-form COMPOSITION_WITH_RULE composition in the
   COMPOSING_CHAR state with zero characters and components so far,
   and emit a composition annotation whose counts are both zero.  */

#define DECODE_EMACS_MULE_20_RULEBASE_COMPOSITION()             \
  do {                                                          \
    cmp_status->method = COMPOSITION_WITH_RULE;                 \
    cmp_status->old_form = 1;                                   \
    cmp_status->state = COMPOSING_CHAR;                         \
    cmp_status->ncomps = 0;                                     \
    cmp_status->nchars = 0;                                     \
    cmp_status->length = MAX_ANNOTATION_LENGTH;                 \
    ADD_COMPOSITION_DATA (charbuf, 0, 0, cmp_status->method);   \
  } while (0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2328
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2329
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
/* Read one more byte into C and start the composition format it
   selects:

     0xF2 + COMPOSITION_RELATIVE .. 0xF2 + COMPOSITION_WITH_RULE_ALTCHARS
        Emacs 21 style header.
     0xA0 .. 0xBF
        Emacs 20 style relative composition; SRC is moved back so
        that the same byte is read again as a composition component.
     0xFF
        Emacs 20 style rule-base composition.

   Any other value, including a negative C, jumps to invalid_code.  */

#define DECODE_EMACS_MULE_COMPOSITION_START()                           \
  do {                                                                  \
    const unsigned char *rewind_to = src;                               \
                                                                        \
    ONE_MORE_BYTE (c);                                                  \
    if (c < 0)                                                          \
      goto invalid_code;                                                \
    if (c - 0xF2 >= COMPOSITION_RELATIVE                                \
        && c - 0xF2 <= COMPOSITION_WITH_RULE_ALTCHARS)                  \
      {                                                                 \
        DECODE_EMACS_MULE_21_COMPOSITION ();                            \
      }                                                                 \
    else if (c >= 0xA0 && c < 0xC0)                                     \
      {                                                                 \
        DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION ();                   \
        /* Re-read C as a composition component.  */                    \
        src = rewind_to;                                                \
      }                                                                 \
    else if (c == 0xFF)                                                 \
      {                                                                 \
        DECODE_EMACS_MULE_20_RULEBASE_COMPOSITION ();                   \
      }                                                                 \
    else                                                                \
      goto invalid_code;                                                \
  } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2353
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
/* Close the composition recorded in CMP_STATUS.  HEAD indexes the
   entry CMP_STATUS->length places before CHARBUF.  For an old-form
   composition, store the accumulated character count at HEAD + 2.
   For a new-form composition whose method is greater than
   COMPOSITION_RELATIVE, store at HEAD the value found at HEAD + 2
   minus CMP_STATUS->length.  In every case reset the state to
   COMPOSING_NO.  */

#define EMACS_MULE_COMPOSITION_END()                                    \
  do {                                                                  \
    int head = - cmp_status->length;                                    \
                                                                        \
    if (! cmp_status->old_form)                                         \
      {                                                                 \
        if (cmp_status->method > COMPOSITION_RELATIVE)                  \
          charbuf[head] = charbuf[head + 2] - cmp_status->length;       \
      }                                                                 \
    else                                                                \
      charbuf[head + 2] = cmp_status->nchars;                           \
    cmp_status->state = COMPOSING_NO;                                   \
  } while (0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2364
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2365
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2366 static int
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
2367 emacs_mule_finish_composition (int *charbuf,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
2368 struct composition_status *cmp_status)
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2369 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2370 int idx = - cmp_status->length;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2371 int new_chars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2372
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2373 if (cmp_status->old_form && cmp_status->nchars > 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2374 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2375 charbuf[idx + 2] = cmp_status->nchars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2376 new_chars = 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2377 if (cmp_status->method == COMPOSITION_WITH_RULE
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2378 && cmp_status->state == COMPOSING_CHAR)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2379 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2380 /* The last rule was invalid. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2381 int rule = charbuf[-1] + 0xA0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2382
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2383 charbuf[-2] = BYTE8_TO_CHAR (rule);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2384 charbuf[-1] = -1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2385 new_chars = 1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2386 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2387 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2388 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2389 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2390 charbuf[idx++] = BYTE8_TO_CHAR (0x80);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2391
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2392 if (cmp_status->method == COMPOSITION_WITH_RULE)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2393 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2394 charbuf[idx++] = BYTE8_TO_CHAR (0xFF);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2395 charbuf[idx++] = -3;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2396 charbuf[idx++] = 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2397 new_chars = 1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2398 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2399 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2400 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2401 int nchars = charbuf[idx + 1] + 0xA0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2402 int nbytes = charbuf[idx + 2] + 0xA0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2403
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2404 charbuf[idx++] = BYTE8_TO_CHAR (0xF2 + cmp_status->method);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2405 charbuf[idx++] = BYTE8_TO_CHAR (nbytes);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2406 charbuf[idx++] = BYTE8_TO_CHAR (nchars);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2407 charbuf[idx++] = -1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2408 new_chars = 4;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2409 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2410 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2411 cmp_status->state = COMPOSING_NO;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2412 return new_chars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2413 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2414
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
/* If a composition is in progress (CMP_STATUS->state is not
   COMPOSING_NO), finish it with emacs_mule_finish_composition and add
   the count it returns to char_offset.  */

#define EMACS_MULE_MAYBE_FINISH_COMPOSITION()                           \
  do {                                                                  \
    if (cmp_status->state != COMPOSING_NO)                              \
      {                                                                 \
        int extra_chars                                                 \
          = emacs_mule_finish_composition (charbuf, cmp_status);        \
                                                                        \
        char_offset += extra_chars;                                     \
      }                                                                 \
  } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2420
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2421
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2422 static void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
2423 decode_coding_emacs_mule (struct coding_system *coding)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2424 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2425 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2426 const unsigned char *src_end = coding->source + coding->src_bytes;
59168
0345f2b10f1d (decode_coding_XXX, decode_composition_emacs_mule)
Dan Nicolaescu <dann@ics.uci.edu>
parents: 59095
diff changeset
2427 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
2428 int *charbuf = coding->charbuf + coding->charbuf_used;
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
2429 /* We may produce two annotations (charset and composition) in one
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
2430 loop and one more charset annotation at the end. */
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
2431 int *charbuf_end
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
2432 = coding->charbuf + coding->charbuf_size - (MAX_ANNOTATION_LENGTH * 3);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2433 int consumed_chars = 0, consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2434 int multibytep = coding->src_multibyte;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
2435 Lisp_Object attrs, charset_list;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2436 int char_offset = coding->produced_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2437 int last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2438 int last_id = charset_ascii;
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
2439 int eol_crlf =
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
2440 !inhibit_eol_conversion && EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2441 int byte_after_cr = -1;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2442 struct composition_status *cmp_status = &coding->spec.emacs_mule.cmp_status;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2443
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
2444 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2445
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2446 if (cmp_status->state != COMPOSING_NO)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2447 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2448 int i;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2449
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2450 for (i = 0; i < cmp_status->length; i++)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2451 *charbuf++ = cmp_status->carryover[i];
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2452 coding->annotated = 1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2453 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2454
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2455 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2456 {
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2457 int c, id;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2458
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2459 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2460 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2461
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2462 if (charbuf >= charbuf_end)
100936
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
2463 {
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
2464 if (byte_after_cr >= 0)
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
2465 src_base--;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
2466 break;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
2467 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2468
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2469 if (byte_after_cr >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2470 c = byte_after_cr, byte_after_cr = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2471 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2472 ONE_MORE_BYTE (c);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2473
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2474 if (c < 0 || c == 0x80)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2475 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2476 EMACS_MULE_MAYBE_FINISH_COMPOSITION ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2477 if (c < 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2478 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2479 *charbuf++ = -c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2480 char_offset++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2481 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2482 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2483 DECODE_EMACS_MULE_COMPOSITION_START ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2484 continue;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2485 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2486
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2487 if (c < 0x80)
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2488 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2489 if (eol_crlf && c == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2490 ONE_MORE_BYTE (byte_after_cr);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2491 id = charset_ascii;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2492 if (cmp_status->state != COMPOSING_NO)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2493 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2494 if (cmp_status->old_form)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2495 EMACS_MULE_MAYBE_FINISH_COMPOSITION ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2496 else if (cmp_status->state >= COMPOSING_COMPONENT_CHAR)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2497 cmp_status->ncomps--;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2498 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2499 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2500 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2501 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2502 int nchars, nbytes;
107321
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
2503 /* emacs_mule_char can load a charset map from a file, which
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
2504 allocates a large structure and might cause buffer text
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
2505 to be relocated as result. Thus, we need to remember the
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
2506 original pointer to buffer text, and fix up all related
107321
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
2507 pointers after the call. */
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
2508 const unsigned char *orig = coding->source;
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
2509 EMACS_INT offset;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2510
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2511 c = emacs_mule_char (coding, src_base, &nbytes, &nchars, &id,
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2512 cmp_status);
107321
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
2513 offset = coding->source - orig;
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
2514 if (offset)
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
2515 {
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
2516 src += offset;
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
2517 src_base += offset;
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
2518 src_end += offset;
9b814b3ee348 Fix bug in decoding emacs-mule encoding.
Eli Zaretskii <eliz@gnu.org>
parents: 107174
diff changeset
2519 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2520 if (c < 0)
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2521 {
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2522 if (c == -1)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2523 goto invalid_code;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2524 if (c == -2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2525 break;
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2526 }
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2527 src = src_base + nbytes;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2528 consumed_chars = consumed_chars_base + nchars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2529 if (cmp_status->state >= COMPOSING_COMPONENT_CHAR)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2530 cmp_status->ncomps -= nchars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2531 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2532
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
2533 /* Now if C >= 0, we found a normally encoded character, if C <
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2534 0, we found an old-style composition component character or
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2535 rule. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2536
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2537 if (cmp_status->state == COMPOSING_NO)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2538 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2539 if (last_id != id)
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2540 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2541 if (last_id != charset_ascii)
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2542 ADD_CHARSET_DATA (charbuf, char_offset - last_offset,
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2543 last_id);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2544 last_id = id;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2545 last_offset = char_offset;
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2546 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2547 *charbuf++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2548 char_offset++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2549 }
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2550 else if (cmp_status->state == COMPOSING_CHAR)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2551 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2552 if (cmp_status->old_form)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2553 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2554 if (c >= 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2555 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2556 EMACS_MULE_MAYBE_FINISH_COMPOSITION ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2557 *charbuf++ = c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2558 char_offset++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2559 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2560 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2561 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2562 *charbuf++ = -c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2563 cmp_status->nchars++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2564 cmp_status->length++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2565 if (cmp_status->nchars == MAX_COMPOSITION_COMPONENTS)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2566 EMACS_MULE_COMPOSITION_END ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2567 else if (cmp_status->method == COMPOSITION_WITH_RULE)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2568 cmp_status->state = COMPOSING_RULE;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2569 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2570 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2571 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2572 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2573 *charbuf++ = c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2574 cmp_status->length++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2575 cmp_status->nchars--;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2576 if (cmp_status->nchars == 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2577 EMACS_MULE_COMPOSITION_END ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2578 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2579 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2580 else if (cmp_status->state == COMPOSING_RULE)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2581 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2582 int rule;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2583
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2584 if (c >= 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2585 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2586 EMACS_MULE_COMPOSITION_END ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2587 *charbuf++ = c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2588 char_offset++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2589 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2590 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2591 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2592 c = -c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2593 DECODE_EMACS_MULE_COMPOSITION_RULE_20 (c, rule);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2594 if (rule < 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2595 goto invalid_code;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2596 *charbuf++ = -2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2597 *charbuf++ = rule;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2598 cmp_status->length += 2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2599 cmp_status->state = COMPOSING_CHAR;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2600 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2601 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2602 else if (cmp_status->state == COMPOSING_COMPONENT_CHAR)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2603 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2604 *charbuf++ = c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2605 cmp_status->length++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2606 if (cmp_status->ncomps == 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2607 cmp_status->state = COMPOSING_CHAR;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2608 else if (cmp_status->ncomps > 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2609 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2610 if (cmp_status->method == COMPOSITION_WITH_RULE_ALTCHARS)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2611 cmp_status->state = COMPOSING_COMPONENT_RULE;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2612 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2613 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2614 EMACS_MULE_MAYBE_FINISH_COMPOSITION ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2615 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2616 else /* COMPOSING_COMPONENT_RULE */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2617 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2618 int rule;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2619
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2620 DECODE_EMACS_MULE_COMPOSITION_RULE_21 (c, rule);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2621 if (rule < 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2622 goto invalid_code;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2623 *charbuf++ = -2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2624 *charbuf++ = rule;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2625 cmp_status->length += 2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2626 cmp_status->ncomps--;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2627 if (cmp_status->ncomps > 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2628 cmp_status->state = COMPOSING_COMPONENT_CHAR;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2629 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2630 EMACS_MULE_MAYBE_FINISH_COMPOSITION ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2631 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2632 continue;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2633
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2634 invalid_code:
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2635 EMACS_MULE_MAYBE_FINISH_COMPOSITION ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2636 src = src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2637 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2638 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2639 *charbuf++ = ASCII_BYTE_P (c) ? c : BYTE8_TO_CHAR (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2640 char_offset++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2641 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2642 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2643
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2644 no_more_source:
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2645 if (cmp_status->state != COMPOSING_NO)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2646 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2647 if (coding->mode & CODING_MODE_LAST_BLOCK)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2648 EMACS_MULE_MAYBE_FINISH_COMPOSITION ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2649 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2650 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2651 int i;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2652
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2653 charbuf -= cmp_status->length;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2654 for (i = 0; i < cmp_status->length; i++)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2655 cmp_status->carryover[i] = charbuf[i];
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2656 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2657 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2658 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
2659 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2660 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2661 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2662 coding->charbuf_used = charbuf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2663 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2664
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2665
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Store into CODES, which must have room for at least two elements,
   the pair of leading codes selected by ID:

     ID <  0xA0          ->  CODES[0] = ID,   CODES[1] = 0
     0xA0 <= ID < 0xE0   ->  CODES[0] = 0x9A, CODES[1] = ID
     0xE0 <= ID < 0xF0   ->  CODES[0] = 0x9B, CODES[1] = ID
     0xF0 <= ID < 0xF5   ->  CODES[0] = 0x9C, CODES[1] = ID
     otherwise           ->  CODES[0] = 0x9D, CODES[1] = ID

   The expansion is a single statement that deliberately does NOT end
   in a semicolon; the caller supplies it.  That keeps the macro safe
   as the body of an unbraced `if' that is followed by `else'.

   Both arguments are parenthesized in the expansion so that
   expression arguments group as the caller intends.  ID may be
   evaluated more than once, so it must not have side effects.  */
#define EMACS_MULE_LEADING_CODES(id, codes)      \
  do {                                           \
    if ((id) < 0xA0)                             \
      (codes)[0] = (id), (codes)[1] = 0;         \
    else if ((id) < 0xE0)                        \
      (codes)[0] = 0x9A, (codes)[1] = (id);      \
    else if ((id) < 0xF0)                        \
      (codes)[0] = 0x9B, (codes)[1] = (id);      \
    else if ((id) < 0xF5)                        \
      (codes)[0] = 0x9C, (codes)[1] = (id);      \
    else                                         \
      (codes)[0] = 0x9D, (codes)[1] = (id);      \
  } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2679
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2680
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2681 static int
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
2682 encode_coding_emacs_mule (struct coding_system *coding)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2683 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2684 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2685 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2686 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2687 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2688 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2689 int safe_room = 8;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2690 int produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
2691 Lisp_Object attrs, charset_list;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2692 int c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2693 int preferred_charset_id = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2694
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
2695 CODING_GET_INFO (coding, attrs, charset_list);
89644
fc9cda144ffc (encode_coding_emacs_mule): Resync charset_list to
Kenichi Handa <handa@m17n.org>
parents: 89642
diff changeset
2696 if (! EQ (charset_list, Vemacs_mule_charset_list))
fc9cda144ffc (encode_coding_emacs_mule): Resync charset_list to
Kenichi Handa <handa@m17n.org>
parents: 89642
diff changeset
2697 {
fc9cda144ffc (encode_coding_emacs_mule): Resync charset_list to
Kenichi Handa <handa@m17n.org>
parents: 89642
diff changeset
2698 CODING_ATTR_CHARSET_LIST (attrs)
fc9cda144ffc (encode_coding_emacs_mule): Resync charset_list to
Kenichi Handa <handa@m17n.org>
parents: 89642
diff changeset
2699 = charset_list = Vemacs_mule_charset_list;
fc9cda144ffc (encode_coding_emacs_mule): Resync charset_list to
Kenichi Handa <handa@m17n.org>
parents: 89642
diff changeset
2700 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2701
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2702 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2703 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2704 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2705 c = *charbuf++;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2706
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2707 if (c < 0)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2708 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2709 /* Handle an annotation. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2710 switch (*charbuf)
54320
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2711 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2712 case CODING_ANNOTATE_COMPOSITION_MASK:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2713 /* Not yet implemented. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2714 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2715 case CODING_ANNOTATE_CHARSET_MASK:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2716 preferred_charset_id = charbuf[3];
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2717 if (preferred_charset_id >= 0
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2718 && NILP (Fmemq (make_number (preferred_charset_id),
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2719 charset_list)))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2720 preferred_charset_id = -1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2721 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2722 default:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2723 abort ();
54320
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2724 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2725 charbuf += -c - 1;
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2726 continue;
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2727 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2728
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2729 if (ASCII_CHAR_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2730 EMIT_ONE_ASCII_BYTE (c);
88690
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
2731 else if (CHAR_BYTE8_P (c))
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
2732 {
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
2733 c = CHAR_TO_BYTE8 (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
2734 EMIT_ONE_BYTE (c);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2735 }
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2736 else
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2737 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2738 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2739 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2740 int dimension;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2741 int emacs_mule_id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2742 unsigned char leading_codes[2];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2743
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2744 if (preferred_charset_id >= 0)
54320
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2745 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2746 charset = CHARSET_FROM_ID (preferred_charset_id);
100176
5706ca7c3d02 (encode_coding_emacs_mule): Be sure to set `code'.
Kenichi Handa <handa@m17n.org>
parents: 100170
diff changeset
2747 if (CHAR_CHARSET_P (c, charset))
5706ca7c3d02 (encode_coding_emacs_mule): Be sure to set `code'.
Kenichi Handa <handa@m17n.org>
parents: 100170
diff changeset
2748 code = ENCODE_CHAR (charset, c);
5706ca7c3d02 (encode_coding_emacs_mule): Be sure to set `code'.
Kenichi Handa <handa@m17n.org>
parents: 100170
diff changeset
2749 else
5706ca7c3d02 (encode_coding_emacs_mule): Be sure to set `code'.
Kenichi Handa <handa@m17n.org>
parents: 100170
diff changeset
2750 charset = char_charset (c, charset_list, &code);
54320
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2751 }
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2752 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2753 charset = char_charset (c, charset_list, &code);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2754 if (! charset)
54320
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2755 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2756 c = coding->default_char;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2757 if (ASCII_CHAR_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2758 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2759 EMIT_ONE_ASCII_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2760 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2761 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2762 charset = char_charset (c, charset_list, &code);
54320
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2763 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2764 dimension = CHARSET_DIMENSION (charset);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2765 emacs_mule_id = CHARSET_EMACS_MULE_ID (charset);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2766 EMACS_MULE_LEADING_CODES (emacs_mule_id, leading_codes);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2767 EMIT_ONE_BYTE (leading_codes[0]);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2768 if (leading_codes[1])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2769 EMIT_ONE_BYTE (leading_codes[1]);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2770 if (dimension == 1)
89642
e97441b6244b (encode_coding_emacs_mule): Emit bytes with MSB.
Kenichi Handa <handa@m17n.org>
parents: 89575
diff changeset
2771 EMIT_ONE_BYTE (code | 0x80);
54320
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2772 else
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2773 {
89642
e97441b6244b (encode_coding_emacs_mule): Emit bytes with MSB.
Kenichi Handa <handa@m17n.org>
parents: 89575
diff changeset
2774 code |= 0x8080;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2775 EMIT_ONE_BYTE (code >> 8);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2776 EMIT_ONE_BYTE (code & 0xFF);
54320
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2777 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2778 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2779 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2780 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2781 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2782 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2783 return 0;
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2784 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2785
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2786
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2787 /*** 7. ISO2022 handlers ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2788
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2789 /* The following note describes the coding system ISO2022 briefly.
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2790 Since the intention of this note is to help understand the
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2791 functions in this file, some parts are NOT ACCURATE or are OVERLY
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2792 SIMPLIFIED. For thorough understanding, please refer to the
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2793 original document of ISO2022. This is equivalent to the standard
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2794 ECMA-35, obtainable from <URL:http://www.ecma.ch/> (*).
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2795
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2796 ISO2022 provides many mechanisms to encode several character sets
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2797 in 7-bit and 8-bit environments. For 7-bit environments, all text
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2798 is encoded using bytes less than 128. This may make the encoded
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2799 text a little bit longer, but the text passes more easily through
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2800 several types of gateway, some of which strip off the MSB (Most
36087
05ef3feab39b Doc and message fixes.
Dave Love <fx@gnu.org>
parents: 35995
diff changeset
2801 Significant Bit).
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2802
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2803 There are two kinds of character sets: control character sets and
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2804 graphic character sets. The former contain control characters such
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2805 as `newline' and `escape' to provide control functions (control
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2806 functions are also provided by escape sequences). The latter
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2807 contain graphic characters such as 'A' and '-'. Emacs recognizes
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2808 two control character sets and many graphic character sets.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2809
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2810 Graphic character sets are classified into one of the following
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2811 four classes, according to the number of bytes (DIMENSION) and
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2812 number of characters in one dimension (CHARS) of the set:
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2813 - DIMENSION1_CHARS94
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2814 - DIMENSION1_CHARS96
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2815 - DIMENSION2_CHARS94
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2816 - DIMENSION2_CHARS96
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2817
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2818 In addition, each character set is assigned an identification tag,
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2819 unique for each set, called the "final character" (denoted as <F>
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2820 hereafter). The <F> of each character set is decided by ECMA(*)
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2821 when it is registered in ISO. The code range of <F> is 0x30..0x7F
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2822 (0x30..0x3F are for private use only).
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2823
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2824 Note (*): ECMA = European Computer Manufacturers Association
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2825
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2826 Here are examples of graphic character sets [NAME(<F>)]:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2827 o DIMENSION1_CHARS94 -- ASCII('B'), right-half-of-JISX0201('I'), ...
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2828 o DIMENSION1_CHARS96 -- right-half-of-ISO8859-1('A'), ...
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2829 o DIMENSION2_CHARS94 -- GB2312('A'), JISX0208('B'), ...
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2830 o DIMENSION2_CHARS96 -- none for the moment
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2831
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2832 A code area (1 byte=8 bits) is divided into 4 areas, C0, GL, C1, and GR.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2833 C0 [0x00..0x1F] -- control character plane 0
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2834 GL [0x20..0x7F] -- graphic character plane 0
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2835 C1 [0x80..0x9F] -- control character plane 1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2836 GR [0xA0..0xFF] -- graphic character plane 1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2837
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2838 A control character set is directly designated and invoked to C0 or
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2839 C1 by an escape sequence. The most common case is that:
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2840 - ISO646's control character set is designated/invoked to C0, and
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2841 - ISO6429's control character set is designated/invoked to C1,
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2842 and usually these designations/invocations are omitted in encoded
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2843 text. In a 7-bit environment, only C0 can be used, and a control
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2844 character for C1 is encoded by an appropriate escape sequence to
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2845 fit into the environment. All control characters for C1 are
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2846 defined to have corresponding escape sequences.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2847
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2848 A graphic character set is at first designated to one of four
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2849 graphic registers (G0 through G3), then these graphic registers are
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2850 invoked to GL or GR. These designations and invocations can be
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2851 done independently. The most common case is that G0 is invoked to
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2852 GL, G1 is invoked to GR, and ASCII is designated to G0. Usually
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2853 these invocations and designations are omitted in encoded text.
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2854 In a 7-bit environment, only GL can be used.
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2855
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2856 When a graphic character set of CHARS94 is invoked to GL, codes
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2857 0x20 and 0x7F of the GL area work as control characters SPACE and
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2858 DEL respectively, and codes 0xA0 and 0xFF of the GR area should not
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2859 be used.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2860
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2861 There are two ways of invocation: locking-shift and single-shift.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2862 With locking-shift, the invocation lasts until the next different
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2863 invocation, whereas with single-shift, the invocation affects the
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2864 following character only and doesn't affect the locking-shift
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2865 state. Invocations are done by the following control characters or
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2866 escape sequences:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2867
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2868 ----------------------------------------------------------------------
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2869 abbrev function cntrl escape seq description
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2870 ----------------------------------------------------------------------
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2871 SI/LS0 (shift-in) 0x0F none invoke G0 into GL
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2872 SO/LS1 (shift-out) 0x0E none invoke G1 into GL
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2873 LS2 (locking-shift-2) none ESC 'n' invoke G2 into GL
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2874 LS3 (locking-shift-3) none ESC 'o' invoke G3 into GL
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2875 LS1R (locking-shift-1 right) none ESC '~' invoke G1 into GR (*)
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2876 LS2R (locking-shift-2 right) none ESC '}' invoke G2 into GR (*)
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2877 LS3R (locking-shift-3 right) none ESC '|' invoke G3 into GR (*)
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2878 SS2 (single-shift-2) 0x8E ESC 'N' invoke G2 for one char
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2879 SS3 (single-shift-3) 0x8F ESC 'O' invoke G3 for one char
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2880 ----------------------------------------------------------------------
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2881 (*) These are not used by any known coding system.
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2882
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2883 Control characters for these functions are defined by macros
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2884 ISO_CODE_XXX in `coding.h'.
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2885
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2886 Designations are done by the following escape sequences:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2887 ----------------------------------------------------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2888 escape sequence description
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2889 ----------------------------------------------------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2890 ESC '(' <F> designate DIMENSION1_CHARS94<F> to G0
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2891 ESC ')' <F> designate DIMENSION1_CHARS94<F> to G1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2892 ESC '*' <F> designate DIMENSION1_CHARS94<F> to G2
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2893 ESC '+' <F> designate DIMENSION1_CHARS94<F> to G3
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2894 ESC ',' <F> designate DIMENSION1_CHARS96<F> to G0 (*)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2895 ESC '-' <F> designate DIMENSION1_CHARS96<F> to G1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2896 ESC '.' <F> designate DIMENSION1_CHARS96<F> to G2
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2897 ESC '/' <F> designate DIMENSION1_CHARS96<F> to G3
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2898 ESC '$' '(' <F> designate DIMENSION2_CHARS94<F> to G0 (**)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2899 ESC '$' ')' <F> designate DIMENSION2_CHARS94<F> to G1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2900 ESC '$' '*' <F> designate DIMENSION2_CHARS94<F> to G2
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2901 ESC '$' '+' <F> designate DIMENSION2_CHARS94<F> to G3
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2902 ESC '$' ',' <F> designate DIMENSION2_CHARS96<F> to G0 (*)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2903 ESC '$' '-' <F> designate DIMENSION2_CHARS96<F> to G1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2904 ESC '$' '.' <F> designate DIMENSION2_CHARS96<F> to G2
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2905 ESC '$' '/' <F> designate DIMENSION2_CHARS96<F> to G3
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2906 ----------------------------------------------------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2907
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2908 In this list, "DIMENSION1_CHARS94<F>" means a graphic character set
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2909 of dimension 1, chars 94, and final character <F>, etc...
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2910
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2911 Note (*): Although these designations are not allowed in ISO2022,
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2912 Emacs accepts them on decoding, and produces them on encoding
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2913 CHARS96 character sets in a coding system which is characterized as
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2914 7-bit environment, non-locking-shift, and non-single-shift.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2915
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2916 Note (**): If <F> is '@', 'A', or 'B', the intermediate character
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2917 '(' must be omitted. We refer to this as "short-form" hereafter.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2918
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2919 Now you may notice that there are a lot of ways of encoding the
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2920 same multilingual text in ISO2022. Actually, there exist many
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2921 coding systems such as Compound Text (used in X11's inter client
36087
05ef3feab39b Doc and message fixes.
Dave Love <fx@gnu.org>
parents: 35995
diff changeset
2922 communication), ISO-2022-JP (used in Japanese Internet), ISO-2022-KR
05ef3feab39b Doc and message fixes.
Dave Love <fx@gnu.org>
parents: 35995
diff changeset
2923 (used in Korean Internet), EUC (Extended UNIX Code, used in Asian
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2924 localized platforms), and all of these are variants of ISO2022.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2925
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2926 In addition to the above, Emacs handles two more kinds of escape
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2927 sequences: ISO6429's direction specification and Emacs' private
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2928 sequence for specifying character composition.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2929
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2930 ISO6429's direction specification takes the following form:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2931 o CSI ']' -- end of the current direction
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2932 o CSI '0' ']' -- end of the current direction
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2933 o CSI '1' ']' -- start of left-to-right text
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2934 o CSI '2' ']' -- start of right-to-left text
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2935 The control character CSI (0x9B: control sequence introducer) is
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2936 abbreviated to the escape sequence ESC '[' in a 7-bit environment.
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2937
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2938 Character composition specification takes the following form:
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2939 o ESC '0' -- start relative composition
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2940 o ESC '1' -- end composition
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2941 o ESC '2' -- start rule-base composition (*)
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2942 o ESC '3' -- start relative composition with alternate chars (**)
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2943 o ESC '4' -- start rule-base composition with alternate chars (**)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2944 Since these are not standard escape sequences of any ISO standard,
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2945 the use of them with these meanings is restricted to Emacs only.
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2946
88771
75c78754826d comments
Dave Love <fx@gnu.org>
parents: 88690
diff changeset
2947 (*) This form is used only in Emacs 20.7 and older versions,
75c78754826d comments
Dave Love <fx@gnu.org>
parents: 88690
diff changeset
2948 but newer versions can safely decode it.
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2949 (**) This form is used only in Emacs 21.1 and newer versions,
88771
75c78754826d comments
Dave Love <fx@gnu.org>
parents: 88690
diff changeset
2950 and older versions can't decode it.
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2951
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2952 Here's a list of example usages of these composition escape
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2953 sequences (categorized by `enum composition_method').
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2954
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2955 COMPOSITION_RELATIVE:
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2956 ESC 0 CHAR [ CHAR ] ESC 1
36087
05ef3feab39b Doc and message fixes.
Dave Love <fx@gnu.org>
parents: 35995
diff changeset
2957 COMPOSITION_WITH_RULE:
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2958 ESC 2 CHAR [ RULE CHAR ] ESC 1
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2959 COMPOSITION_WITH_ALTCHARS:
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2960 ESC 3 ALTCHAR [ ALTCHAR ] ESC 0 CHAR [ CHAR ] ESC 1
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2961 COMPOSITION_WITH_RULE_ALTCHARS:
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2962 ESC 4 ALTCHAR [ RULE ALTCHAR ] ESC 0 CHAR [ CHAR ] ESC 1 */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2963
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2964 enum iso_code_class_type iso_code_class[256];
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2965
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2966 #define SAFE_CHARSET_P(coding, id) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2967 ((id) <= (coding)->max_charset_id \
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
2968 && (coding)->safe_charsets[id] != 255)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2969
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2970
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2971 #define SHIFT_OUT_OK(category) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2972 (CODING_ISO_INITIAL (&coding_categories[category], 1) >= 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2973
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2974 static void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
2975 setup_iso_safe_charsets (Lisp_Object attrs)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2976 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2977 Lisp_Object charset_list, safe_charsets;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2978 Lisp_Object request;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2979 Lisp_Object reg_usage;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2980 Lisp_Object tail;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2981 int reg94, reg96;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2982 int flags = XINT (AREF (attrs, coding_attr_iso_flags));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2983 int max_charset_id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2984
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2985 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2986 if ((flags & CODING_ISO_FLAG_FULL_SUPPORT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2987 && ! EQ (charset_list, Viso_2022_charset_list))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2988 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2989 CODING_ATTR_CHARSET_LIST (attrs)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2990 = charset_list = Viso_2022_charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2991 ASET (attrs, coding_attr_safe_charsets, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2992 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2993
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2994 if (STRINGP (AREF (attrs, coding_attr_safe_charsets)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2995 return;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2996
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2997 max_charset_id = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2998 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2999 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3000 int id = XINT (XCAR (tail));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3001 if (max_charset_id < id)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3002 max_charset_id = id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3003 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3004
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
3005 safe_charsets = make_uninit_string (max_charset_id + 1);
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
3006 memset (SDATA (safe_charsets), 255, max_charset_id + 1);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3007 request = AREF (attrs, coding_attr_iso_request);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3008 reg_usage = AREF (attrs, coding_attr_iso_usage);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3009 reg94 = XINT (XCAR (reg_usage));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3010 reg96 = XINT (XCDR (reg_usage));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3011
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3012 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3013 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3014 Lisp_Object id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3015 Lisp_Object reg;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3016 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3017
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3018 id = XCAR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3019 charset = CHARSET_FROM_ID (XINT (id));
88681
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3020 reg = Fcdr (Fassq (id, request));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3021 if (! NILP (reg))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3022 SSET (safe_charsets, XINT (id), XINT (reg));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3023 else if (charset->iso_chars_96)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3024 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3025 if (reg96 < 4)
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3026 SSET (safe_charsets, XINT (id), reg96);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3027 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3028 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3029 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3030 if (reg94 < 4)
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3031 SSET (safe_charsets, XINT (id), reg94);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3032 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3033 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3034 ASET (attrs, coding_attr_safe_charsets, safe_charsets);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3035 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3036
50047
8e17fbb2ac77 (CODING_ADD_COMPOSITION_COMPONENT): If the number of
Kenichi Handa <handa@m17n.org>
parents: 49600
diff changeset
3037
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3038 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
3039 Check if a text is encoded in one of ISO-2022 based coding systems.
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3040 If it is, return 1, else return 0. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3041
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
3042 static int
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
3043 detect_coding_iso_2022 (struct coding_system *coding,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
3044 struct coding_detection_info *detect_info)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3045 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3046 const unsigned char *src = coding->source, *src_base = src;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3047 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3048 int multibytep = coding->src_multibyte;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3049 int single_shifting = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3050 int id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3051 int c, c1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3052 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3053 int i;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3054 int rejected = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3055 int found = 0;
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3056 int composition_count = -1;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3057
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3058 detect_info->checked |= CATEGORY_MASK_ISO;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3059
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3060 for (i = coding_category_iso_7; i <= coding_category_iso_8_else; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3061 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3062 struct coding_system *this = &(coding_categories[i]);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3063 Lisp_Object attrs, val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3064
94944
c16046e21b90 (detect_coding_iso_2022): Ignore a coding category that
Kenichi Handa <handa@m17n.org>
parents: 93877
diff changeset
3065 if (this->id < 0)
c16046e21b90 (detect_coding_iso_2022): Ignore a coding category that
Kenichi Handa <handa@m17n.org>
parents: 93877
diff changeset
3066 continue;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3067 attrs = CODING_ID_ATTRS (this->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3068 if (CODING_ISO_FLAGS (this) & CODING_ISO_FLAG_FULL_SUPPORT
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
3069 && ! EQ (CODING_ATTR_CHARSET_LIST (attrs), Viso_2022_charset_list))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3070 setup_iso_safe_charsets (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3071 val = CODING_ATTR_SAFE_CHARSETS (attrs);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3072 this->max_charset_id = SCHARS (val) - 1;
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
3073 this->safe_charsets = SDATA (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3074 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3075
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3076 /* A coding system of this category is always ASCII compatible. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3077 src += coding->head_ascii;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3078
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3079 while (rejected != CATEGORY_MASK_ISO)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3080 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
3081 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3082 ONE_MORE_BYTE (c);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3083 switch (c)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3084 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3085 case ISO_CODE_ESC:
30204
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
3086 if (inhibit_iso_escape_detection)
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
3087 break;
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3088 single_shifting = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3089 ONE_MORE_BYTE (c);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3090 if (c >= '(' && c <= '/')
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3091 {
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3092 /* Designation sequence for a charset of dimension 1. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3093 ONE_MORE_BYTE (c1);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3094 if (c1 < ' ' || c1 >= 0x80
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3095 || (id = iso_charset_table[0][c >= ','][c1]) < 0)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3096 /* Invalid designation sequence. Just ignore. */
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3097 break;
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3098 }
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3099 else if (c == '$')
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3100 {
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3101 /* Designation sequence for a charset of dimension 2. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3102 ONE_MORE_BYTE (c);
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3103 if (c >= '@' && c <= 'B')
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3104 /* Designation for JISX0208.1978, GB2312, or JISX0208. */
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3105 id = iso_charset_table[1][0][c];
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3106 else if (c >= '(' && c <= '/')
17320
9d15bec5f47e (detect_coding_iso2022, detect_coding_mask): Ignore
Kenichi Handa <handa@m17n.org>
parents: 17304
diff changeset
3107 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3108 ONE_MORE_BYTE (c1);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3109 if (c1 < ' ' || c1 >= 0x80
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3110 || (id = iso_charset_table[1][c >= ','][c1]) < 0)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3111 /* Invalid designation sequence. Just ignore. */
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3112 break;
17320
9d15bec5f47e (detect_coding_iso2022, detect_coding_mask): Ignore
Kenichi Handa <handa@m17n.org>
parents: 17304
diff changeset
3113 }
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3114 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3115 /* Invalid designation sequence. Just ignore it. */
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3116 break;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3117 }
23116
6736da064f4a (detect_coding_iso2022): Handle ESC N and ESC O
Kenichi Handa <handa@m17n.org>
parents: 23089
diff changeset
3118 else if (c == 'N' || c == 'O')
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3119 {
23116
6736da064f4a (detect_coding_iso2022): Handle ESC N and ESC O
Kenichi Handa <handa@m17n.org>
parents: 23089
diff changeset
3120 /* ESC <Fe> for SS2 or SS3. */
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3121 single_shifting = 1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3122 rejected |= CATEGORY_MASK_ISO_7BIT | CATEGORY_MASK_ISO_8BIT;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3123 break;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3124 }
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3125 else if (c == '1')
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3126 {
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3127 /* End of composition. */
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3128 if (composition_count < 0
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3129 || composition_count > MAX_COMPOSITION_COMPONENTS)
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3130 /* Invalid */
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3131 break;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3132 composition_count = -1;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3133 found |= CATEGORY_MASK_ISO;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3134 }
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3135 else if (c >= '0' && c <= '4')
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3136 {
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3137 /* ESC <Fp> for start/end composition. */
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3138 composition_count = 0;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3139 break;
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3140 }
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3141 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3142 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3143 /* Invalid escape sequence. Just ignore it. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3144 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3145 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3146
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3147 /* We found a valid designation sequence for CHARSET. */
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3148 rejected |= CATEGORY_MASK_ISO_8BIT;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3149 if (SAFE_CHARSET_P (&coding_categories[coding_category_iso_7],
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3150 id))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3151 found |= CATEGORY_MASK_ISO_7;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3152 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3153 rejected |= CATEGORY_MASK_ISO_7;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3154 if (SAFE_CHARSET_P (&coding_categories[coding_category_iso_7_tight],
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3155 id))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3156 found |= CATEGORY_MASK_ISO_7_TIGHT;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3157 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3158 rejected |= CATEGORY_MASK_ISO_7_TIGHT;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3159 if (SAFE_CHARSET_P (&coding_categories[coding_category_iso_7_else],
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3160 id))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3161 found |= CATEGORY_MASK_ISO_7_ELSE;
23116
6736da064f4a (detect_coding_iso2022): Handle ESC N and ESC O
Kenichi Handa <handa@m17n.org>
parents: 23089
diff changeset
3162 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3163 rejected |= CATEGORY_MASK_ISO_7_ELSE;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3164 if (SAFE_CHARSET_P (&coding_categories[coding_category_iso_8_else],
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3165 id))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3166 found |= CATEGORY_MASK_ISO_8_ELSE;
23116
6736da064f4a (detect_coding_iso2022): Handle ESC N and ESC O
Kenichi Handa <handa@m17n.org>
parents: 23089
diff changeset
3167 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3168 rejected |= CATEGORY_MASK_ISO_8_ELSE;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3169 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3170
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3171 case ISO_CODE_SO:
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3172 case ISO_CODE_SI:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3173 /* Locking shift out/in. */
30204
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
3174 if (inhibit_iso_escape_detection)
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
3175 break;
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3176 single_shifting = 0;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3177 rejected |= CATEGORY_MASK_ISO_7BIT | CATEGORY_MASK_ISO_8BIT;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3178 break;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3179
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3180 case ISO_CODE_CSI:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3181 /* Control sequence introducer. */
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3182 single_shifting = 0;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3183 rejected |= CATEGORY_MASK_ISO_7BIT | CATEGORY_MASK_ISO_7_ELSE;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3184 found |= CATEGORY_MASK_ISO_8_ELSE;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3185 goto check_extra_latin;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3186
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3187 case ISO_CODE_SS2:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3188 case ISO_CODE_SS3:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3189 /* Single shift. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3190 if (inhibit_iso_escape_detection)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3191 break;
89780
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
3192 single_shifting = 0;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3193 rejected |= CATEGORY_MASK_ISO_7BIT;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3194 if (CODING_ISO_FLAGS (&coding_categories[coding_category_iso_8_1])
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3195 & CODING_ISO_FLAG_SINGLE_SHIFT)
89780
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
3196 found |= CATEGORY_MASK_ISO_8_1, single_shifting = 1;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3197 if (CODING_ISO_FLAGS (&coding_categories[coding_category_iso_8_2])
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3198 & CODING_ISO_FLAG_SINGLE_SHIFT)
89780
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
3199 found |= CATEGORY_MASK_ISO_8_2, single_shifting = 1;
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
3200 if (single_shifting)
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
3201 break;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3202 goto check_extra_latin;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3203
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3204 default:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
3205 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
3206 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3207 if (c < 0x80)
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3208 {
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3209 if (composition_count >= 0)
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3210 composition_count++;
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3211 single_shifting = 0;
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3212 break;
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3213 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3214 if (c >= 0xA0)
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
3215 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3216 rejected |= CATEGORY_MASK_ISO_7BIT | CATEGORY_MASK_ISO_7_ELSE;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3217 found |= CATEGORY_MASK_ISO_8_1;
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3218 /* Check the length of succeeding codes of the range
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3219 0xA0..0xFF. If the byte length is even, we include
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3220 CATEGORY_MASK_ISO_8_2 in `found'. We can check this
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3221 only when we are not single shifting. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3222 if (! single_shifting
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3223 && ! (rejected & CATEGORY_MASK_ISO_8_2))
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3224 {
29299
b33b38d81020 (detect_coding_iso2022): Fix code for checking
Kenichi Handa <handa@m17n.org>
parents: 29275
diff changeset
3225 int i = 1;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3226 while (src < src_end)
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3227 {
106826
64cd76243389 Fix handling of euc-xx coding systems.
Kenichi Handa <handa@m17n.org>
parents: 106815
diff changeset
3228 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3229 ONE_MORE_BYTE (c);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3230 if (c < 0xA0)
106826
64cd76243389 Fix handling of euc-xx coding systems.
Kenichi Handa <handa@m17n.org>
parents: 106815
diff changeset
3231 {
64cd76243389 Fix handling of euc-xx coding systems.
Kenichi Handa <handa@m17n.org>
parents: 106815
diff changeset
3232 src = src_base;
64cd76243389 Fix handling of euc-xx coding systems.
Kenichi Handa <handa@m17n.org>
parents: 106815
diff changeset
3233 break;
64cd76243389 Fix handling of euc-xx coding systems.
Kenichi Handa <handa@m17n.org>
parents: 106815
diff changeset
3234 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3235 i++;
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3236 }
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3237
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3238 if (i & 1 && src < src_end)
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3239 {
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3240 rejected |= CATEGORY_MASK_ISO_8_2;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3241 if (composition_count >= 0)
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3242 composition_count += i;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3243 }
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3244 else
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3245 {
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3246 found |= CATEGORY_MASK_ISO_8_2;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3247 if (composition_count >= 0)
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3248 composition_count += i / 2;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3249 }
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3250 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3251 break;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3252 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3253 check_extra_latin:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3254 single_shifting = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3255 if (! VECTORP (Vlatin_extra_code_table)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3256 || NILP (XVECTOR (Vlatin_extra_code_table)->contents[c]))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3257 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3258 rejected = CATEGORY_MASK_ISO;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3259 break;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3260 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3261 if (CODING_ISO_FLAGS (&coding_categories[coding_category_iso_8_1])
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3262 & CODING_ISO_FLAG_LATIN_EXTRA)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3263 found |= CATEGORY_MASK_ISO_8_1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3264 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3265 rejected |= CATEGORY_MASK_ISO_8_1;
89780
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
3266 rejected |= CATEGORY_MASK_ISO_8_2;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3267 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3268 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3269 detect_info->rejected |= CATEGORY_MASK_ISO;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3270 return 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3271
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3272 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3273 detect_info->rejected |= rejected;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3274 detect_info->found |= (found & ~rejected);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3275 return 1;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3276 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3277
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3278
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3279 /* Set designation state into CODING. Set CHARS_96 to -1 if the
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3280 escape sequence should be kept. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3281 #define DECODE_DESIGNATION(reg, dim, chars_96, final) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3282 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3283 int id, prev; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3284 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3285 if (final < '0' || final >= 128 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3286 || ((id = ISO_CHARSET_TABLE (dim, chars_96, final)) < 0) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3287 || !SAFE_CHARSET_P (coding, id)) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3288 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3289 CODING_ISO_DESIGNATION (coding, reg) = -2; \
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3290 chars_96 = -1; \
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3291 break; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3292 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3293 prev = CODING_ISO_DESIGNATION (coding, reg); \
88681
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3294 if (id == charset_jisx0201_roman) \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3295 { \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3296 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_USE_ROMAN) \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3297 id = charset_ascii; \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3298 } \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3299 else if (id == charset_jisx0208_1978) \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3300 { \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3301 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_USE_OLDJIS) \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3302 id = charset_jisx0208; \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3303 } \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3304 CODING_ISO_DESIGNATION (coding, reg) = id; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3305 /* If there was an invalid designation to REG previously, and this \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3306 designation is ASCII to REG, we should keep this designation \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3307 sequence. */ \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3308 if (prev == -2 && id == charset_ascii) \
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3309 chars_96 = -1; \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3310 } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3311
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3312
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3313 /* Handle these composition sequences (ALT: alternate char):
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3314
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3315 (1) relative composition: ESC 0 CHAR ... ESC 1
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3316 (2) rulebase composition: ESC 2 CHAR RULE CHAR RULE ... CHAR ESC 1
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3317 (3) altchar composition: ESC 3 ALT ... ALT ESC 0 CHAR ... ESC 1
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3318 (4) alt&rule composition: ESC 4 ALT RULE ... ALT ESC 0 CHAR ... ESC 1
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3319
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3320 When the start sequence (ESC 0/2/3/4) is found, this annotation
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3321 header is produced.
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3322
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3323 [ -LENGTH(==-5) CODING_ANNOTATE_COMPOSITION_MASK NCHARS(==0) 0 METHOD ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3324
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3325 Then, upon reading CHAR or RULE (one or two bytes), these codes are
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3326 produced until the end sequence (ESC 1) is found:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3327
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3328 (1) CHAR ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3329 (2) CHAR -2 DECODED-RULE CHAR -2 DECODED-RULE ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3330 (3) ALT ... ALT -1 -1 CHAR ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3331 (4) ALT -2 DECODED-RULE ALT -2 DECODED-RULE ... ALT -1 -1 CHAR ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3332
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3333 When the end sequence (ESC 1) is found, LENGTH and NCHARS in the
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3334 annotation header are updated as below:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3335
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3336 (1) LENGTH: unchanged, NCHARS: number of CHARs
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3337 (2) LENGTH: unchanged, NCHARS: number of CHARs
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3338 (3) LENGTH: += number of ALTs + 2, NCHARS: number of CHARs
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3339 (4) LENGTH: += number of ALTs * 3, NCHARS: number of CHARs
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3340
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3341 If an error is found while composing, the annotation header is
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3342 changed to:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3343
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3344 [ ESC '0'/'2'/'3'/'4' -2 0 ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3345
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3346 and the sequence [ -2 DECODED-RULE ] is changed to the original
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3347 byte sequence as below:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3348 o the original byte sequence is B: [ B -1 ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3349 o the original byte sequence is B1 B2: [ B1 B2 ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3350 and the sequence [ -1 -1 ] is changed to the original byte
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3351 sequence:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3352 [ ESC '0' ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3353 */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3354
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3355 /* Decode a composition rule C1 and maybe one more byte from the
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3356 source, and set RULE to the encoded composition rule, NBYTES to the
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3357 length of the composition rule. If the rule is invalid, set RULE
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3358 to some negative value. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3359
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3360 #define DECODE_COMPOSITION_RULE(rule, nbytes) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3361 do { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3362 rule = c1 - 32; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3363 if (rule < 0) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3364 break; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3365 if (rule < 81) /* old format (before ver.21) */ \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3366 { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3367 int gref = (rule) / 9; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3368 int nref = (rule) % 9; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3369 if (gref == 4) gref = 10; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3370 if (nref == 4) nref = 10; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3371 rule = COMPOSITION_ENCODE_RULE (gref, nref); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3372 nbytes = 1; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3373 } \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3374 else /* new format (after ver.21) */ \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3375 { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3376 int c; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3377 \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3378 ONE_MORE_BYTE (c); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3379 rule = COMPOSITION_ENCODE_RULE (rule - 81, c - 32); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3380 if (rule >= 0) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3381 rule += 0x100; /* to distinguish it from the old format */ \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3382 nbytes = 2; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3383 } \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3384 } while (0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3385
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3386 #define ENCODE_COMPOSITION_RULE(rule) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3387 do { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3388 int gref = (rule % 0x100) / 12, nref = (rule % 0x100) % 12; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3389 \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3390 if (rule < 0x100) /* old format */ \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3391 { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3392 if (gref == 10) gref = 4; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3393 if (nref == 10) nref = 4; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3394 charbuf[idx] = 32 + gref * 9 + nref; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3395 charbuf[idx + 1] = -1; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3396 new_chars++; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3397 } \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3398 else /* new format */ \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3399 { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3400 charbuf[idx] = 32 + 81 + gref; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3401 charbuf[idx + 1] = 32 + nref; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3402 new_chars += 2; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3403 } \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3404 } while (0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3405
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3406 /* Finish the current composition as invalid.
   CHARBUF points just past the composition data collected so far; that
   data starts at CHARBUF[-CMP_STATUS->length].  The first five
   elements of the data are overwritten with ESC, the digit that
   corresponds to CMP_STATUS->method ('0', '2', '3' or '4'), and the
   values -2, 0, -1.  When the method compares >= COMPOSITION_WITH_RULE,
   the remaining elements are scanned: the element after each -2 marker
   is handed to ENCODE_COMPOSITION_RULE, and each -1 marker together
   with the element after it is overwritten with ESC '0'.
   CMP_STATUS->state is reset to COMPOSING_NO.
   Return CMP_STATUS->nchars plus whatever was added to the count while
   scanning (two per -1 marker, plus what ENCODE_COMPOSITION_RULE adds).  */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3407
109100
2bc9a0c04c87 Remove __P and P_ from .c and .m files and definition of P_
Jan D <jan.h.d@swipnet.se>
parents: 107984
diff changeset
3408 static int finish_composition (int *, struct composition_status *);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3409
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3410 static int
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
3411 finish_composition (int *charbuf, struct composition_status *cmp_status)
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3412 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3413 int idx = - cmp_status->length;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3414 int new_chars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3415
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3416 /* Recover the original ESC sequence in place of the first elements
   of the composition data.  NOTE(review): the -2, 0, -1 values written
   after it presumably act as filler that later stages skip; confirm
   against the consumer of charbuf.  */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3417 charbuf[idx++] = ISO_CODE_ESC;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3418 charbuf[idx++] = (cmp_status->method == COMPOSITION_RELATIVE ? '0'
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3419 : cmp_status->method == COMPOSITION_WITH_RULE ? '2'
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3420 : cmp_status->method == COMPOSITION_WITH_ALTCHARS ? '3'
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3421 /* cmp_status->method == COMPOSITION_WITH_RULE_ALTCHARS */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3422 : '4');
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3423 charbuf[idx++] = -2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3424 charbuf[idx++] = 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3425 charbuf[idx++] = -1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3426 new_chars = cmp_status->nchars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3427 if (cmp_status->method >= COMPOSITION_WITH_RULE)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3428 for (; idx < 0; idx++)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3429 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3430 int elt = charbuf[idx];
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3431
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3432 if (elt == -2)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3433 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3434 ENCODE_COMPOSITION_RULE (charbuf[idx + 1]);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3435 idx++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3436 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3437 else if (elt == -1)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3438 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3439 charbuf[idx++] = ISO_CODE_ESC;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3440 charbuf[idx] = '0';
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3441 new_chars += 2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3442 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3443 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3444 cmp_status->state = COMPOSING_NO;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3445 return new_chars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3446 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3447
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
3448 /* If characters are under composition, finish the composition.
   That is, when cmp_status->state is not COMPOSING_NO, call
   finish_composition and add its return value to char_offset.
   Expects charbuf, cmp_status and char_offset to be variables in the
   scope where the macro is expanded.  */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3449 #define MAYBE_FINISH_COMPOSITION() \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3450 do { \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3451 if (cmp_status->state != COMPOSING_NO) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3452 char_offset += finish_composition (charbuf, cmp_status); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3453 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3454
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
3455 /* Handle composition start sequence ESC 0, ESC 2, ESC 3, or ESC 4.
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3456
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
3457 ESC 0 : relative composition : ESC 0 CHAR ... ESC 1
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
3458 ESC 2 : rulebase composition : ESC 2 CHAR RULE CHAR RULE ... CHAR ESC 1
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3459 ESC 3 : altchar composition : ESC 3 CHAR ... ESC 0 CHAR ... ESC 1
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3460 ESC 4 : alt&rule composition : ESC 4 CHAR RULE ... CHAR ESC 0 CHAR ... ESC 1
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3461
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3462 Produce this annotation sequence now:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3463
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3464 [ -LENGTH(==-4) CODING_ANNOTATE_COMPOSITION_MASK NCHARS(==0) METHOD ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3465 */
/* C1 is the byte that followed ESC.
   When C1 is '0' and either the state is COMPOSING_COMPONENT_CHAR with
   method COMPOSITION_WITH_ALTCHARS, or the state is
   COMPOSING_COMPONENT_RULE with method COMPOSITION_WITH_RULE_ALTCHARS,
   no new composition is started: two -1 elements are stored, the
   state becomes COMPOSING_CHAR and cmp_status->length grows by two.
   In every other case any pending composition is first finished as
   invalid by MAYBE_FINISH_COMPOSITION, then the method is chosen from
   C1, the state is set to COMPOSING_CHAR for C1 <= '2' and to
   COMPOSING_COMPONENT_CHAR otherwise, the annotation is emitted with
   ADD_COMPOSITION_DATA, and the counters in cmp_status are reset.
   Expects charbuf, cmp_status, char_offset and coding to be variables
   in the scope where the macro is expanded.
   NOTE(review): the code records MAX_ANNOTATION_LENGTH as the length
   and passes two zeros to ADD_COMPOSITION_DATA, whereas the layout
   shown above has a length of 4 and a single zero; confirm that the
   layout description is still current.  */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3466
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3467 #define DECODE_COMPOSITION_START(c1) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3468 do { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3469 if (c1 == '0' \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3470 && ((cmp_status->state == COMPOSING_COMPONENT_CHAR \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3471 && cmp_status->method == COMPOSITION_WITH_ALTCHARS) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3472 || (cmp_status->state == COMPOSING_COMPONENT_RULE \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3473 && cmp_status->method == COMPOSITION_WITH_RULE_ALTCHARS))) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3474 { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3475 *charbuf++ = -1; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3476 *charbuf++= -1; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3477 cmp_status->state = COMPOSING_CHAR; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3478 cmp_status->length += 2; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3479 } \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3480 else \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3481 { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3482 MAYBE_FINISH_COMPOSITION (); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3483 cmp_status->method = (c1 == '0' ? COMPOSITION_RELATIVE \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3484 : c1 == '2' ? COMPOSITION_WITH_RULE \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3485 : c1 == '3' ? COMPOSITION_WITH_ALTCHARS \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3486 : COMPOSITION_WITH_RULE_ALTCHARS); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3487 cmp_status->state \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3488 = (c1 <= '2' ? COMPOSING_CHAR : COMPOSING_COMPONENT_CHAR); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3489 ADD_COMPOSITION_DATA (charbuf, 0, 0, cmp_status->method); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3490 cmp_status->length = MAX_ANNOTATION_LENGTH; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3491 cmp_status->nchars = cmp_status->ncomps = 0; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3492 coding->annotated = 1; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3493 } \
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3494 } while (0)
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3495
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3496
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3497 /* Handle composition end sequence ESC 1.
   The sequence is rejected -- any pending composition is finished as
   invalid by MAYBE_FINISH_COMPOSITION and control jumps to the
   `invalid_code' label of the expanding function -- when
   cmp_status->nchars is zero, when the state is COMPOSING_CHAR and the
   method is COMPOSITION_WITH_RULE, or when the state is not
   COMPOSING_CHAR and the method is anything else.
   Otherwise the first element of the composition data,
   charbuf[-cmp_status->length], is decreased by NCOMPS + 2 for
   COMPOSITION_WITH_ALTCHARS or by NCOMPS * 3 for
   COMPOSITION_WITH_RULE_ALTCHARS, the element two past it is set to
   cmp_status->nchars, char_offset advances by that count, and the
   state returns to COMPOSING_NO.
   Expects charbuf, cmp_status and char_offset to be variables in the
   scope where the macro is expanded.  */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3498
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3499 #define DECODE_COMPOSITION_END() \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3500 do { \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3501 if (cmp_status->nchars == 0 \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3502 || ((cmp_status->state == COMPOSING_CHAR) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3503 == (cmp_status->method == COMPOSITION_WITH_RULE))) \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3504 { \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3505 MAYBE_FINISH_COMPOSITION (); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3506 goto invalid_code; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3507 } \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3508 if (cmp_status->method == COMPOSITION_WITH_ALTCHARS) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3509 charbuf[- cmp_status->length] -= cmp_status->ncomps + 2; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3510 else if (cmp_status->method == COMPOSITION_WITH_RULE_ALTCHARS) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3511 charbuf[- cmp_status->length] -= cmp_status->ncomps * 3; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3512 charbuf[- cmp_status->length + 2] = cmp_status->nchars; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3513 char_offset += cmp_status->nchars; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3514 cmp_status->state = COMPOSING_NO; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3515 } while (0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3516
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3517 /* Store a composition rule RULE in charbuf, and update cmp_status.
   The rule occupies two elements: the marker -2 followed by RULE.
   cmp_status->length grows by two and cmp_status->state is
   decremented.  NOTE(review): the decrement presumably steps from a
   *_RULE state back to the matching *_CHAR state and so relies on the
   order of the state enumeration; confirm against its definition.  */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3518
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3519 #define STORE_COMPOSITION_RULE(rule) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3520 do { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3521 *charbuf++ = -2; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3522 *charbuf++ = rule; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3523 cmp_status->length += 2; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3524 cmp_status->state--; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3525 } while (0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3526
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3527 /* Store a composed char or a component char C in charbuf, and update
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3528 cmp_status.
   C takes one element and cmp_status->length grows by one.  The
   character is counted in cmp_status->nchars when the state is
   COMPOSING_CHAR and in cmp_status->ncomps otherwise.  Afterwards the
   state is incremented when the method is COMPOSITION_WITH_RULE, or
   when it is COMPOSITION_WITH_RULE_ALTCHARS and the state is
   COMPOSING_COMPONENT_CHAR.  NOTE(review): the increment presumably
   moves to the matching *_RULE state so that a rule is expected next,
   and so relies on the order of the state enumeration; confirm
   against its definition.  */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3529
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3530 #define STORE_COMPOSITION_CHAR(c) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3531 do { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3532 *charbuf++ = (c); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3533 cmp_status->length++; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3534 if (cmp_status->state == COMPOSING_CHAR) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3535 cmp_status->nchars++; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3536 else \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3537 cmp_status->ncomps++; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3538 if (cmp_status->method == COMPOSITION_WITH_RULE \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3539 || (cmp_status->method == COMPOSITION_WITH_RULE_ALTCHARS \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3540 && cmp_status->state == COMPOSING_COMPONENT_CHAR)) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3541 cmp_status->state++; \
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3542 } while (0)
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3543
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3544
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3545 /* See the above "GENERAL NOTES on `decode_coding_XXX ()' functions". */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3546
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3547 static void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
3548 decode_coding_iso_2022 (struct coding_system *coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3549 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3550 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3551 const unsigned char *src_end = coding->source + coding->src_bytes;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3552 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
3553 int *charbuf = coding->charbuf + coding->charbuf_used;
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
3554 /* We may produce two annotations (charset and composition) in one
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
3555 loop and one more charset annotation at the end. */
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3556 int *charbuf_end
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
3557 = coding->charbuf + coding->charbuf_size - (MAX_ANNOTATION_LENGTH * 3);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3558 int consumed_chars = 0, consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3559 int multibytep = coding->src_multibyte;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3560 /* Charsets invoked to graphic plane 0 and 1 respectively. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3561 int charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3562 int charset_id_1 = CODING_ISO_INVOKED_CHARSET (coding, 1);
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3563 int charset_id_2, charset_id_3;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3564 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3565 int c;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3566 struct composition_status *cmp_status = CODING_ISO_CMP_STATUS (coding);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
3567 Lisp_Object attrs, charset_list;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3568 int char_offset = coding->produced_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3569 int last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3570 int last_id = charset_ascii;
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
3571 int eol_crlf =
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
3572 !inhibit_eol_conversion && EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3573 int byte_after_cr = -1;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3574 int i;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3575
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
3576 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3577 setup_iso_safe_charsets (attrs);
90772
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
3578 /* Charset list may have been changed. */
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
3579 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
3580 coding->safe_charsets = SDATA (CODING_ATTR_SAFE_CHARSETS (attrs));
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3581
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3582 if (cmp_status->state != COMPOSING_NO)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3583 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3584 for (i = 0; i < cmp_status->length; i++)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3585 *charbuf++ = cmp_status->carryover[i];
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3586 coding->annotated = 1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3587 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3588
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3589 while (1)
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3590 {
103474
7ead50363544 (decode_coding_iso_2022): Check MSB of bytes more rigidly.
Kenichi Handa <handa@m17n.org>
parents: 103448
diff changeset
3591 int c1, c2, c3;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3592
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3593 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3594 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3595
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3596 if (charbuf >= charbuf_end)
100936
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
3597 {
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
3598 if (byte_after_cr >= 0)
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
3599 src_base--;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
3600 break;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
3601 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3602
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3603 if (byte_after_cr >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3604 c1 = byte_after_cr, byte_after_cr = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3605 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3606 ONE_MORE_BYTE (c1);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
3607 if (c1 < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
3608 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3609
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3610 if (CODING_ISO_EXTSEGMENT_LEN (coding) > 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3611 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3612 *charbuf++ = ASCII_BYTE_P (c1) ? c1 : BYTE8_TO_CHAR (c1);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3613 char_offset++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3614 CODING_ISO_EXTSEGMENT_LEN (coding)--;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3615 continue;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3616 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3617
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3618 if (CODING_ISO_EMBEDDED_UTF_8 (coding))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3619 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3620 if (c1 == ISO_CODE_ESC)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3621 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3622 if (src + 1 >= src_end)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3623 goto no_more_source;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3624 *charbuf++ = ISO_CODE_ESC;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3625 char_offset++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3626 if (src[0] == '%' && src[1] == '@')
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3627 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3628 src += 2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3629 consumed_chars += 2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3630 char_offset += 2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3631 /* We are sure charbuf can contain two more chars. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3632 *charbuf++ = '%';
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3633 *charbuf++ = '@';
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3634 CODING_ISO_EMBEDDED_UTF_8 (coding) = 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3635 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3636 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3637 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3638 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3639 *charbuf++ = ASCII_BYTE_P (c1) ? c1 : BYTE8_TO_CHAR (c1);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3640 char_offset++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3641 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3642 continue;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3643 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3644
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3645 if ((cmp_status->state == COMPOSING_RULE
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3646 || cmp_status->state == COMPOSING_COMPONENT_RULE)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3647 && c1 != ISO_CODE_ESC)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3648 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3649 int rule, nbytes;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3650
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3651 DECODE_COMPOSITION_RULE (rule, nbytes);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3652 if (rule < 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3653 goto invalid_code;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3654 STORE_COMPOSITION_RULE (rule);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3655 continue;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3656 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3657
89279
1fd77c471ee6 (decode_coding_utf_8): When eol_type is Qdos, handle
Kenichi Handa <handa@m17n.org>
parents: 89227
diff changeset
3658 /* We produce at most one character. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3659 switch (iso_code_class [c1])
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3660 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3661 case ISO_0x20_or_0x7F:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3662 if (charset_id_0 < 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3663 || ! CHARSET_ISO_CHARS_96 (CHARSET_FROM_ID (charset_id_0)))
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3664 /* This is SPACE or DEL. */
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3665 charset = CHARSET_FROM_ID (charset_ascii);
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3666 else
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3667 charset = CHARSET_FROM_ID (charset_id_0);
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3668 break;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3669
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3670 case ISO_graphic_plane_0:
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3671 if (charset_id_0 < 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3672 charset = CHARSET_FROM_ID (charset_ascii);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3673 else
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3674 charset = CHARSET_FROM_ID (charset_id_0);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3675 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3676
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3677 case ISO_0xA0_or_0xFF:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3678 if (charset_id_1 < 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3679 || ! CHARSET_ISO_CHARS_96 (CHARSET_FROM_ID (charset_id_1))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3680 || CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3681 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3682 /* This is a graphic character; we fall through ... */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3683
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3684 case ISO_graphic_plane_1:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3685 if (charset_id_1 < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3686 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3687 charset = CHARSET_FROM_ID (charset_id_1);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3688 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3689
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3690 case ISO_control_0:
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3691 if (eol_crlf && c1 == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3692 ONE_MORE_BYTE (byte_after_cr);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3693 MAYBE_FINISH_COMPOSITION ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3694 charset = CHARSET_FROM_ID (charset_ascii);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3695 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3696
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3697 case ISO_control_1:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3698 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3699
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3700 case ISO_shift_out:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3701 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_LOCKING_SHIFT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3702 || CODING_ISO_DESIGNATION (coding, 1) < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3703 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3704 CODING_ISO_INVOCATION (coding, 0) = 1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3705 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3706 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3707
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3708 case ISO_shift_in:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3709 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_LOCKING_SHIFT))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3710 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3711 CODING_ISO_INVOCATION (coding, 0) = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3712 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3713 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3714
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3715 case ISO_single_shift_2_7:
106564
fea46c7aca79 (decode_coding_iso_2022): Ignore ISO_CODE_SS2_7 (0x19)
Kenichi Handa <handa@m17n.org>
parents: 105959
diff changeset
3716 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS))
fea46c7aca79 (decode_coding_iso_2022): Ignore ISO_CODE_SS2_7 (0x19)
Kenichi Handa <handa@m17n.org>
parents: 105959
diff changeset
3717 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3718 case ISO_single_shift_2:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3719 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3720 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3721 /* SS2 is handled as an escape sequence of ESC 'N' */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3722 c1 = 'N';
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3723 goto label_escape_sequence;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3724
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3725 case ISO_single_shift_3:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3726 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3727 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3728 /* SS3 is handled as an escape sequence of ESC 'O' */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3729 c1 = 'O';
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3730 goto label_escape_sequence;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3731
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3732 case ISO_control_sequence_introducer:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3733 /* CSI is handled as an escape sequence of ESC '[' ... */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3734 c1 = '[';
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3735 goto label_escape_sequence;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3736
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3737 case ISO_escape:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3738 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3739 label_escape_sequence:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3740 /* Escape sequences handled here are invocation,
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3741 designation, direction specification, and character
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3742 composition specification. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3743 switch (c1)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3744 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3745 case '&': /* revision of following character set */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3746 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3747 if (!(c1 >= '@' && c1 <= '~'))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3748 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3749 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3750 if (c1 != ISO_CODE_ESC)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3751 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3752 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3753 goto label_escape_sequence;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3754
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3755 case '$': /* designation of 2-byte character set */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3756 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_DESIGNATION))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3757 goto invalid_code;
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3758 {
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3759 int reg, chars96;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3760
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3761 ONE_MORE_BYTE (c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3762 if (c1 >= '@' && c1 <= 'B')
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3763 { /* designation of JISX0208.1978, GB2312.1980,
23339
2da87b489590 (check_composing_code): Fix previous change. Now it
Kenichi Handa <handa@m17n.org>
parents: 23325
diff changeset
3764 or JISX0208.1980 */
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3765 reg = 0, chars96 = 0;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3766 }
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3767 else if (c1 >= 0x28 && c1 <= 0x2B)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3768 { /* designation of DIMENSION2_CHARS94 character set */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3769 reg = c1 - 0x28, chars96 = 0;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3770 ONE_MORE_BYTE (c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3771 }
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3772 else if (c1 >= 0x2C && c1 <= 0x2F)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3773 { /* designation of DIMENSION2_CHARS96 character set */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3774 reg = c1 - 0x2C, chars96 = 1;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3775 ONE_MORE_BYTE (c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3776 }
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3777 else
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3778 goto invalid_code;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3779 DECODE_DESIGNATION (reg, 2, chars96, c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3780 /* We must update these variables now. */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3781 if (reg == 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3782 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3783 else if (reg == 1)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3784 charset_id_1 = CODING_ISO_INVOKED_CHARSET (coding, 1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3785 if (chars96 < 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3786 goto invalid_code;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3787 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3788 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3789
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3790 case 'n': /* invocation of locking-shift-2 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3791 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_LOCKING_SHIFT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3792 || CODING_ISO_DESIGNATION (coding, 2) < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3793 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3794 CODING_ISO_INVOCATION (coding, 0) = 2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3795 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3796 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3797
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3798 case 'o': /* invocation of locking-shift-3 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3799 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_LOCKING_SHIFT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3800 || CODING_ISO_DESIGNATION (coding, 3) < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3801 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3802 CODING_ISO_INVOCATION (coding, 0) = 3;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3803 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3804 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3805
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3806 case 'N': /* invocation of single-shift-2 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3807 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3808 || CODING_ISO_DESIGNATION (coding, 2) < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3809 goto invalid_code;
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3810 charset_id_2 = CODING_ISO_DESIGNATION (coding, 2);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3811 if (charset_id_2 < 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3812 charset = CHARSET_FROM_ID (charset_ascii);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3813 else
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3814 charset = CHARSET_FROM_ID (charset_id_2);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3815 ONE_MORE_BYTE (c1);
30578
705b94e152b1 (decode_coding_iso2022): More strict check for handling single
Kenichi Handa <handa@m17n.org>
parents: 30487
diff changeset
3816 if (c1 < 0x20 || (c1 >= 0x80 && c1 < 0xA0))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3817 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3818 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3819
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3820 case 'O': /* invocation of single-shift-3 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3821 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3822 || CODING_ISO_DESIGNATION (coding, 3) < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3823 goto invalid_code;
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3824 charset_id_3 = CODING_ISO_DESIGNATION (coding, 3);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3825 if (charset_id_3 < 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3826 charset = CHARSET_FROM_ID (charset_ascii);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3827 else
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3828 charset = CHARSET_FROM_ID (charset_id_3);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3829 ONE_MORE_BYTE (c1);
30578
705b94e152b1 (decode_coding_iso2022): More strict check for handling single
Kenichi Handa <handa@m17n.org>
parents: 30487
diff changeset
3830 if (c1 < 0x20 || (c1 >= 0x80 && c1 < 0xA0))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3831 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3832 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3833
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3834 case '0': case '2': case '3': case '4': /* start composition */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3835 if (! (coding->common_flags & CODING_ANNOTATE_COMPOSITION_MASK))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3836 goto invalid_code;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3837 if (last_id != charset_ascii)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3838 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3839 ADD_CHARSET_DATA (charbuf, char_offset- last_offset, last_id);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3840 last_id = charset_ascii;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3841 last_offset = char_offset;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3842 }
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3843 DECODE_COMPOSITION_START (c1);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3844 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3845
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3846 case '1': /* end composition */
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3847 if (cmp_status->state == COMPOSING_NO)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3848 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3849 DECODE_COMPOSITION_END ();
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3850 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3851
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3852 case '[': /* specification of direction */
105179
8143cdf4806f (decode_coding_iso_2022): Fix operator precedence.
Andreas Schwab <schwab@linux-m68k.org>
parents: 104636
diff changeset
3853 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_DIRECTION))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3854 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3855 /* For the moment, nested direction is not supported.
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3856 So, `coding->mode & CODING_MODE_DIRECTION' zero means
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
3857 left-to-right, and nonzero means right-to-left. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3858 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3859 switch (c1)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3860 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3861 case ']': /* end of the current direction */
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3862 coding->mode &= ~CODING_MODE_DIRECTION;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3863
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3864 case '0': /* end of the current direction */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3865 case '1': /* start of left-to-right direction */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3866 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3867 if (c1 == ']')
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3868 coding->mode &= ~CODING_MODE_DIRECTION;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3869 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3870 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3871 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3872
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3873 case '2': /* start of right-to-left direction */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3874 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3875 if (c1 == ']')
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3876 coding->mode |= CODING_MODE_DIRECTION;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3877 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3878 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3879 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3880
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3881 default:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3882 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3883 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3884 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3885
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3886 case '%':
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3887 ONE_MORE_BYTE (c1);
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3888 if (c1 == '/')
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3889 {
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3890 /* CTEXT extended segment:
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3891 ESC % / [0-4] M L --ENCODING-NAME-- \002 --BYTES--
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3892 We keep these bytes as is for the moment.
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3893 They may be decoded by post-read-conversion. */
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3894 int dim, M, L;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3895 int size;
56191
75f56340b4f9 (MAX_ALLOCA): Remove define.
Kim F. Storm <storm@cua.dk>
parents: 56028
diff changeset
3896
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3897 ONE_MORE_BYTE (dim);
109710
62d9702eb261 Improve the encoding by compound-text-with-extensions.
Kenichi Handa <handa@etlken>
parents: 107507
diff changeset
3898 if (dim < '0' || dim > '4')
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3899 goto invalid_code;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3900 ONE_MORE_BYTE (M);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3901 if (M < 128)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3902 goto invalid_code;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3903 ONE_MORE_BYTE (L);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3904 if (L < 128)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3905 goto invalid_code;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3906 size = ((M - 128) * 128) + (L - 128);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3907 if (charbuf + 6 > charbuf_end)
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3908 goto break_loop;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3909 *charbuf++ = ISO_CODE_ESC;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3910 *charbuf++ = '%';
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3911 *charbuf++ = '/';
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3912 *charbuf++ = dim;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3913 *charbuf++ = BYTE8_TO_CHAR (M);
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3914 *charbuf++ = BYTE8_TO_CHAR (L);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3915 CODING_ISO_EXTSEGMENT_LEN (coding) = size;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3916 }
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3917 else if (c1 == 'G')
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3918 {
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3919 /* XFree86 extension for embedding UTF-8 in CTEXT:
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3920 ESC % G --UTF-8-BYTES-- ESC % @
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3921 We keep these bytes as is for the moment.
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3922 They may be decoded by post-read-conversion. */
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3923 if (charbuf + 3 > charbuf_end)
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3924 goto break_loop;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3925 *charbuf++ = ISO_CODE_ESC;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3926 *charbuf++ = '%';
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3927 *charbuf++ = 'G';
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3928 CODING_ISO_EMBEDDED_UTF_8 (coding) = 1;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3929 }
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3930 else
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3931 goto invalid_code;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3932 continue;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3933 break;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3934
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3935 default:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3936 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_DESIGNATION))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3937 goto invalid_code;
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3938 {
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3939 int reg, chars96;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3940
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3941 if (c1 >= 0x28 && c1 <= 0x2B)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3942 { /* designation of DIMENSION1_CHARS94 character set */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3943 reg = c1 - 0x28, chars96 = 0;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3944 ONE_MORE_BYTE (c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3945 }
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3946 else if (c1 >= 0x2C && c1 <= 0x2F)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3947 { /* designation of DIMENSION1_CHARS96 character set */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3948 reg = c1 - 0x2C, chars96 = 1;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3949 ONE_MORE_BYTE (c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3950 }
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3951 else
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3952 goto invalid_code;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3953 DECODE_DESIGNATION (reg, 1, chars96, c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3954 /* We must update these variables now. */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3955 if (reg == 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3956 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3957 else if (reg == 1)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3958 charset_id_1 = CODING_ISO_INVOKED_CHARSET (coding, 1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3959 if (chars96 < 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3960 goto invalid_code;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3961 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3962 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3963 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3964 }
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3965
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3966 if (cmp_status->state == COMPOSING_NO
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3967 && charset->id != charset_ascii
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3968 && last_id != charset->id)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3969 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3970 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
3971 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3972 last_id = charset->id;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3973 last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3974 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3975
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3976 /* Now we know CHARSET and 1st position code C1 of a character.
103474
7ead50363544 (decode_coding_iso_2022): Check MSB of bytes more rigidly.
Kenichi Handa <handa@m17n.org>
parents: 103448
diff changeset
3977 Produce a decoded character while getting 2nd and 3rd
7ead50363544 (decode_coding_iso_2022): Check MSB of bytes more rigidly.
Kenichi Handa <handa@m17n.org>
parents: 103448
diff changeset
3978 position codes C2, C3 if necessary. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3979 if (CHARSET_DIMENSION (charset) > 1)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3980 {
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3981 ONE_MORE_BYTE (c2);
103474
7ead50363544 (decode_coding_iso_2022): Check MSB of bytes more rigidly.
Kenichi Handa <handa@m17n.org>
parents: 103448
diff changeset
3982 if (c2 < 0x20 || (c2 >= 0x80 && c2 < 0xA0)
7ead50363544 (decode_coding_iso_2022): Check MSB of bytes more rigidly.
Kenichi Handa <handa@m17n.org>
parents: 103448
diff changeset
3983 || ((c1 & 0x80) != (c2 & 0x80)))
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3984 /* C2 is not in a valid range. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3985 goto invalid_code;
103474
7ead50363544 (decode_coding_iso_2022): Check MSB of bytes more rigidly.
Kenichi Handa <handa@m17n.org>
parents: 103448
diff changeset
3986 if (CHARSET_DIMENSION (charset) == 2)
7ead50363544 (decode_coding_iso_2022): Check MSB of bytes more rigidly.
Kenichi Handa <handa@m17n.org>
parents: 103448
diff changeset
3987 c1 = (c1 << 8) | c2;
7ead50363544 (decode_coding_iso_2022): Check MSB of bytes more rigidly.
Kenichi Handa <handa@m17n.org>
parents: 103448
diff changeset
3988 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3989 {
103474
7ead50363544 (decode_coding_iso_2022): Check MSB of bytes more rigidly.
Kenichi Handa <handa@m17n.org>
parents: 103448
diff changeset
3990 ONE_MORE_BYTE (c3);
7ead50363544 (decode_coding_iso_2022): Check MSB of bytes more rigidly.
Kenichi Handa <handa@m17n.org>
parents: 103448
diff changeset
3991 if (c3 < 0x20 || (c3 >= 0x80 && c3 < 0xA0)
7ead50363544 (decode_coding_iso_2022): Check MSB of bytes more rigidly.
Kenichi Handa <handa@m17n.org>
parents: 103448
diff changeset
3992 || ((c1 & 0x80) != (c3 & 0x80)))
7ead50363544 (decode_coding_iso_2022): Check MSB of bytes more rigidly.
Kenichi Handa <handa@m17n.org>
parents: 103448
diff changeset
3993 /* C3 is not in a valid range. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3994 goto invalid_code;
103474
7ead50363544 (decode_coding_iso_2022): Check MSB of bytes more rigidly.
Kenichi Handa <handa@m17n.org>
parents: 103448
diff changeset
3995 c1 = (c1 << 16) | (c2 << 8) | c2;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3996 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3997 }
103474
7ead50363544 (decode_coding_iso_2022): Check MSB of bytes more rigidly.
Kenichi Handa <handa@m17n.org>
parents: 103448
diff changeset
3998 c1 &= 0x7F7F7F;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3999 CODING_DECODE_CHAR (coding, src, src_base, src_end, charset, c1, c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4000 if (c < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4001 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4002 MAYBE_FINISH_COMPOSITION ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4003 for (; src_base < src; src_base++, char_offset++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4004 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4005 if (ASCII_BYTE_P (*src_base))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4006 *charbuf++ = *src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4007 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4008 *charbuf++ = BYTE8_TO_CHAR (*src_base);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4009 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4010 }
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4011 else if (cmp_status->state == COMPOSING_NO)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4012 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4013 *charbuf++ = c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4014 char_offset++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4015 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4016 else if ((cmp_status->state == COMPOSING_CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4017 ? cmp_status->nchars
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4018 : cmp_status->ncomps)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4019 >= MAX_COMPOSITION_COMPONENTS)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4020 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4021 /* Too long composition. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4022 MAYBE_FINISH_COMPOSITION ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4023 *charbuf++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4024 char_offset++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4025 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4026 else
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4027 STORE_COMPOSITION_CHAR (c);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4028 continue;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4029
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4030 invalid_code:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4031 MAYBE_FINISH_COMPOSITION ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4032 src = src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4033 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4034 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4035 *charbuf++ = c < 0 ? -c : ASCII_BYTE_P (c) ? c : BYTE8_TO_CHAR (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4036 char_offset++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4037 coding->errors++;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
4038 continue;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
4039
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
4040 break_loop:
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
4041 break;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4042 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4043
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4044 no_more_source:
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4045 if (cmp_status->state != COMPOSING_NO)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4046 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4047 if (coding->mode & CODING_MODE_LAST_BLOCK)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4048 MAYBE_FINISH_COMPOSITION ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4049 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4050 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4051 charbuf -= cmp_status->length;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4052 for (i = 0; i < cmp_status->length; i++)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4053 cmp_status->carryover[i] = charbuf[i];
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4054 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4055 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4056 else if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4057 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4058 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4059 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4060 coding->charbuf_used = charbuf - coding->charbuf;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4061 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4062
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4063
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
4064 /* ISO2022 encoding stuff. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4065
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4066 /*
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
4067 It is not enough to say just "ISO2022" on encoding; we have to
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4068 specify more details. In Emacs, each coding system of ISO2022
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4069 variant has the following specifications:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4070 1. Initial designation to G0 thru G3.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4071 2. Allows short-form designation?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4072 3. ASCII should be designated to G0 before control characters?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4073 4. ASCII should be designated to G0 at end of line?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4074 5. 7-bit environment or 8-bit environment?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4075 6. Use locking-shift?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4076 7. Use single-shift?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4077 And the following two are only for Japanese:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4078 8. Use ASCII in place of JISX0201-1976-Roman?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4079 9. Use JISX0208-1983 in place of JISX0208-1978?
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4080 These specifications are encoded in CODING_ISO_FLAGS (coding) as flag bits
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4081 defined by macros CODING_ISO_FLAG_XXX. See `coding.h' for more
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
4082 details.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4083 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4084
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4085 /* Produce codes (escape sequence) for designating CHARSET to graphic
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4086 register REG at DST, and increment DST. If <final-char> of CHARSET is
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4087 '@', 'A', or 'B' and the coding system CODING allows it, produce
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4088 the short-form designation sequence. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4089
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4090 #define ENCODE_DESIGNATION(charset, reg, coding) \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4091 do { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4092 unsigned char final_char = CHARSET_ISO_FINAL (charset); \
109717
8949aad5e992 Use const char* instead of char*.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109573
diff changeset
4093 const char *intermediate_char_94 = "()*+"; \
8949aad5e992 Use const char* instead of char*.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109573
diff changeset
4094 const char *intermediate_char_96 = ",-./"; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4095 int revision = -1; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4096 int c; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4097 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4098 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_REVISION) \
88856
13a375bc220d (ENCODE_DESIGNATION, decode_eol)
Dave Love <fx@gnu.org>
parents: 88845
diff changeset
4099 revision = CHARSET_ISO_REVISION (charset); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4100 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4101 if (revision >= 0) \
20150
402b6e5f4b58 (encode_designation_at_bol): Fix bug of finding graphic
Kenichi Handa <handa@m17n.org>
parents: 20105
diff changeset
4102 { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4103 EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, '&'); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4104 EMIT_ONE_BYTE ('@' + revision); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4105 } \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4106 EMIT_ONE_ASCII_BYTE (ISO_CODE_ESC); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4107 if (CHARSET_DIMENSION (charset) == 1) \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4108 { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4109 if (! CHARSET_ISO_CHARS_96 (charset)) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4110 c = intermediate_char_94[reg]; \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4111 else \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4112 c = intermediate_char_96[reg]; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4113 EMIT_ONE_ASCII_BYTE (c); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4114 } \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4115 else \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4116 { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4117 EMIT_ONE_ASCII_BYTE ('$'); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4118 if (! CHARSET_ISO_CHARS_96 (charset)) \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4119 { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4120 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_LONG_FORM \
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4121 || reg != 0 \
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4122 || final_char < '@' || final_char > 'B') \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4123 EMIT_ONE_ASCII_BYTE (intermediate_char_94[reg]); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4124 } \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4125 else \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4126 EMIT_ONE_ASCII_BYTE (intermediate_char_96[reg]); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4127 } \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4128 EMIT_ONE_ASCII_BYTE (final_char); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4129 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4130 CODING_ISO_DESIGNATION (coding, reg) = CHARSET_ID (charset); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4131 } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4132
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4133
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4134 /* The following two macros produce codes (control character or escape
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4135 sequence) for ISO2022 single-shift functions (single-shift-2 and
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4136 single-shift-3). */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4137
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Emit single-shift-2 and mark CODING (taken from the enclosing
   scope) as being in single-shift state.  The two-byte form `ESC N'
   is used when CODING has CODING_ISO_FLAG_SEVEN_BITS set, the single
   byte ISO_CODE_SS2 otherwise.  */
#define ENCODE_SINGLE_SHIFT_2                                           \
  do                                                                    \
    {                                                                   \
      if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS))   \
        {                                                               \
          EMIT_ONE_BYTE (ISO_CODE_SS2);                                 \
        }                                                               \
      else                                                              \
        {                                                               \
          EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, 'N');                     \
        }                                                               \
      CODING_ISO_SINGLE_SHIFTING (coding) = 1;                          \
    }                                                                   \
  while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4146
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4147
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Emit single-shift-3 and mark CODING (taken from the enclosing
   scope) as being in single-shift state.  The two-byte form `ESC O'
   is used when CODING has CODING_ISO_FLAG_SEVEN_BITS set, the single
   byte ISO_CODE_SS3 otherwise.  */
#define ENCODE_SINGLE_SHIFT_3                                           \
  do                                                                    \
    {                                                                   \
      if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS))   \
        {                                                               \
          EMIT_ONE_BYTE (ISO_CODE_SS3);                                 \
        }                                                               \
      else                                                              \
        {                                                               \
          EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, 'O');                     \
        }                                                               \
      CODING_ISO_SINGLE_SHIFTING (coding) = 1;                          \
    }                                                                   \
  while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4156
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4157
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4158 /* The following four macros produce codes (control character or
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4159 escape sequence) for ISO2022 locking-shift functions (shift-in,
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4160 shift-out, locking-shift-2, and locking-shift-3). */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4161
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Emit shift-in (ISO_CODE_SI) and record in CODING (taken from the
   enclosing scope) that graphic register 0 is now invoked on graphic
   plane 0.  */
#define ENCODE_SHIFT_IN                                                 \
  do                                                                    \
    {                                                                   \
      EMIT_ONE_ASCII_BYTE (ISO_CODE_SI);                                \
      CODING_ISO_INVOCATION (coding, 0) = 0;                            \
    }                                                                   \
  while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4167
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4168
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Emit shift-out (ISO_CODE_SO) and record in CODING (taken from the
   enclosing scope) that graphic register 1 is now invoked on graphic
   plane 0.  */
#define ENCODE_SHIFT_OUT                                                \
  do                                                                    \
    {                                                                   \
      EMIT_ONE_ASCII_BYTE (ISO_CODE_SO);                                \
      CODING_ISO_INVOCATION (coding, 0) = 1;                            \
    }                                                                   \
  while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4174
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4175
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Emit locking-shift-2 (`ESC n') and record in CODING (taken from
   the enclosing scope) that graphic register 2 is now invoked on
   graphic plane 0.  */
#define ENCODE_LOCKING_SHIFT_2                                          \
  do                                                                    \
    {                                                                   \
      EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, 'n');                         \
      CODING_ISO_INVOCATION (coding, 0) = 2;                            \
    }                                                                   \
  while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4181
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4182
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Emit locking-shift-3 (`ESC o') and record in CODING (taken from
   the enclosing scope) that graphic register 3 is now invoked on
   graphic plane 0.

   The final byte must be `o': ISO/IEC 2022 assigns `ESC n' to
   locking-shift-2 and `ESC o' to locking-shift-3.  Emitting `n' here
   would invoke register 2 on the receiving side while this encoder
   believes register 3 is active.  */
#define ENCODE_LOCKING_SHIFT_3                                          \
  do {                                                                  \
    EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, 'o');                           \
    CODING_ISO_INVOCATION (coding, 0) = 3;                              \
  } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4188
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4189
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
/* Produce the code for a one-dimensional character whose character
   set is CHARSET and whose position-code is C1.  Designation and
   invocation sequences are produced first if necessary.

   CHARSET must be an lvalue: when CODING has CODING_ISO_FLAG_USE_ROMAN
   set and CHARSET is charset_ascii, it is replaced by the charset
   whose id is charset_jisx0201_roman.

   The macro reads CODING, DST and PRODUCED_CHARS from the enclosing
   scope.  C1 is fully parenthesized in the expansion, so any
   expression may be passed; it is evaluated once, on the iteration
   that emits the character.  */

#define ENCODE_ISO_CHARACTER_DIMENSION1(charset, c1)                    \
  do {                                                                  \
    int id = CHARSET_ID (charset);                                      \
                                                                        \
    if ((CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_USE_ROMAN)         \
        && id == charset_ascii)                                         \
      {                                                                 \
        id = charset_jisx0201_roman;                                    \
        charset = CHARSET_FROM_ID (id);                                 \
      }                                                                 \
                                                                        \
    if (CODING_ISO_SINGLE_SHIFTING (coding))                            \
      {                                                                 \
        /* A single shift is pending; it covers exactly this one        \
           character, so clear the state afterwards.  */                \
        if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS)     \
          EMIT_ONE_ASCII_BYTE ((c1) & 0x7F);                            \
        else                                                            \
          EMIT_ONE_BYTE ((c1) | 0x80);                                  \
        CODING_ISO_SINGLE_SHIFTING (coding) = 0;                        \
        break;                                                          \
      }                                                                 \
    else if (id == CODING_ISO_INVOKED_CHARSET (coding, 0))              \
      {                                                                 \
        /* Invoked on graphic plane 0: 8th bit clear.  */               \
        EMIT_ONE_ASCII_BYTE ((c1) & 0x7F);                              \
        break;                                                          \
      }                                                                 \
    else if (id == CODING_ISO_INVOKED_CHARSET (coding, 1))              \
      {                                                                 \
        /* Invoked on graphic plane 1: 8th bit set.  */                 \
        EMIT_ONE_BYTE ((c1) | 0x80);                                    \
        break;                                                          \
      }                                                                 \
    else                                                                \
      /* Since CHARSET is not yet invoked to any graphic planes, we     \
         must invoke it, or, at first, designate it to some graphic     \
         register.  Then repeat the loop to actually produce the        \
         character.  */                                                 \
      dst = encode_invocation_designation (charset, coding, dst,        \
                                           &produced_chars);            \
  } while (1)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4232
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4233
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Produce the codes for a two-dimensional character whose character
   set is CHARSET and whose position-codes are C1 and C2.  Designation
   and invocation codes are produced first if necessary.

   CHARSET must be an lvalue: when CODING has
   CODING_ISO_FLAG_USE_OLDJIS set and CHARSET is charset_jisx0208, it
   is replaced by the charset whose id is charset_jisx0208_1978.

   The macro reads CODING, DST and PRODUCED_CHARS from the enclosing
   scope.  */

#define ENCODE_ISO_CHARACTER_DIMENSION2(charset, c1, c2)                \
  do {                                                                  \
    int id = CHARSET_ID (charset);                                      \
                                                                        \
    if ((CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_USE_OLDJIS)        \
        && id == charset_jisx0208)                                      \
      {                                                                 \
        id = charset_jisx0208_1978;                                     \
        charset = CHARSET_FROM_ID (id);                                 \
      }                                                                 \
                                                                        \
    if (! CODING_ISO_SINGLE_SHIFTING (coding))                          \
      {                                                                 \
        if (id == CODING_ISO_INVOKED_CHARSET (coding, 0))               \
          {                                                             \
            /* Invoked on graphic plane 0: 8th bits clear.  */          \
            EMIT_TWO_ASCII_BYTES ((c1) & 0x7F, (c2) & 0x7F);            \
            break;                                                      \
          }                                                             \
        if (id == CODING_ISO_INVOKED_CHARSET (coding, 1))               \
          {                                                             \
            /* Invoked on graphic plane 1: 8th bits set.  */            \
            EMIT_TWO_BYTES ((c1) | 0x80, (c2) | 0x80);                  \
            break;                                                      \
          }                                                             \
        /* CHARSET is on neither graphic plane yet.  Invoke it,         \
           designating it to a graphic register first if needed,        \
           then go round again to emit the character itself.  */        \
        dst = encode_invocation_designation (charset, coding, dst,      \
                                             &produced_chars);          \
        continue;                                                       \
      }                                                                 \
                                                                        \
    /* A single shift is pending; it covers exactly this one            \
       character, so clear the state afterwards.  */                    \
    if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS)         \
      EMIT_TWO_ASCII_BYTES ((c1) & 0x7F, (c2) & 0x7F);                  \
    else                                                                \
      EMIT_TWO_BYTES ((c1) | 0x80, (c2) | 0x80);                        \
    CODING_ISO_SINGLE_SHIFTING (coding) = 0;                            \
    break;                                                              \
  } while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4276
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4277
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Encode character C of CHARSET: obtain its code with ENCODE_CHAR,
   then hand it to the one- or two-dimensional emitter according to
   CHARSET_DIMENSION.  For the two-dimensional case the code is split
   into `code >> 8' and `code & 0xFF'.  CHARSET is passed on
   parenthesized but must still be an lvalue, because the emitters may
   assign to it.  */
#define ENCODE_ISO_CHARACTER(charset, c)                                \
  do                                                                    \
    {                                                                   \
      int code = ENCODE_CHAR ((charset), (c));                          \
                                                                        \
      if (CHARSET_DIMENSION (charset) != 1)                             \
        ENCODE_ISO_CHARACTER_DIMENSION2 ((charset),                     \
                                         code >> 8, code & 0xFF);       \
      else                                                              \
        ENCODE_ISO_CHARACTER_DIMENSION1 ((charset), code);              \
    }                                                                   \
  while (0)
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4287
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
4288
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4289 /* Produce designation and invocation codes at a place pointed by DST
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4290 to use CHARSET. The element `spec.iso_2022' of *CODING is updated.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4291 Return new DST. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4292
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4293 unsigned char *
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
4294 encode_invocation_designation (struct charset *charset,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
4295 struct coding_system *coding,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
4296 unsigned char *dst, int *p_nchars)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4297 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4298 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4299 int produced_chars = *p_nchars;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4300 int reg; /* graphic register number */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4301 int id = CHARSET_ID (charset);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4302
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4303 /* At first, check designations. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4304 for (reg = 0; reg < 4; reg++)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4305 if (id == CODING_ISO_DESIGNATION (coding, reg))
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4306 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4307
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4308 if (reg >= 4)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4309 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4310 /* CHARSET is not yet designated to any graphic registers. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4311 /* At first check the requested designation. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4312 reg = CODING_ISO_REQUEST (coding, id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4313 if (reg < 0)
18002
a14261786239 (encode_invocation_designation): Use macro
Kenichi Handa <handa@m17n.org>
parents: 17835
diff changeset
4314 /* Since CHARSET requests no special designation, designate it
a14261786239 (encode_invocation_designation): Use macro
Kenichi Handa <handa@m17n.org>
parents: 17835
diff changeset
4315 to graphic register 0. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4316 reg = 0;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4317
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4318 ENCODE_DESIGNATION (charset, reg, coding);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4319 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4320
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4321 if (CODING_ISO_INVOCATION (coding, 0) != reg
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4322 && CODING_ISO_INVOCATION (coding, 1) != reg)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4323 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4324 /* Since the graphic register REG is not invoked to any graphic
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4325 planes, invoke it to graphic plane 0. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4326 switch (reg)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4327 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4328 case 0: /* graphic register 0 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4329 ENCODE_SHIFT_IN;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4330 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4331
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4332 case 1: /* graphic register 1 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4333 ENCODE_SHIFT_OUT;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4334 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4335
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4336 case 2: /* graphic register 2 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4337 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4338 ENCODE_SINGLE_SHIFT_2;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4339 else
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4340 ENCODE_LOCKING_SHIFT_2;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4341 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4342
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4343 case 3: /* graphic register 3 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4344 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4345 ENCODE_SINGLE_SHIFT_3;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4346 else
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4347 ENCODE_LOCKING_SHIFT_3;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4348 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4349 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4350 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4351
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4352 *p_nchars = produced_chars;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4353 return dst;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4354 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4355
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
/* The following three macros produce codes for indicating direction
   of text.  */

/* Produce a control sequence introducer: the two ASCII bytes ESC '['
   when the coding system has CODING_ISO_FLAG_SEVEN_BITS set, and the
   single byte ISO_CODE_CSI otherwise.

   The flag is tested with `&', like the other CODING_ISO_FLAGS tests
   in this file; comparing the whole flag word with `==' would select
   the single-byte form whenever any other flag is also set.

   Expands in terms of `coding' and of whatever the EMIT_* macros
   expect to find at the expansion site.  */
#define ENCODE_CONTROL_SEQUENCE_INTRODUCER                              \
  do {                                                                  \
    if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS)         \
      EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, '[');                         \
    else                                                                \
      EMIT_ONE_BYTE (ISO_CODE_CSI);                                     \
  } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4365
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4366
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Produce the code indicating right-to-left text: a control sequence
   introducer followed by the ASCII bytes '2' and ']'.

   ENCODE_CONTROL_SEQUENCE_INTRODUCER is an object-like macro, so it
   is used here without an argument list; writing `(dst)' after it
   would leave a stray `(dst)' behind its `while (0)' and fail to
   compile as soon as this macro is expanded.  */
#define ENCODE_DIRECTION_R2L()                  \
  do {                                          \
    ENCODE_CONTROL_SEQUENCE_INTRODUCER;         \
    EMIT_TWO_ASCII_BYTES ('2', ']');            \
  } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4372
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4373
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Produce the code indicating left-to-right text: a control sequence
   introducer followed by the ASCII bytes '0' and ']'.

   ENCODE_CONTROL_SEQUENCE_INTRODUCER is an object-like macro, so it
   is used here without an argument list; writing `(dst)' after it
   would leave a stray `(dst)' behind its `while (0)' and fail to
   compile as soon as this macro is expanded.  */
#define ENCODE_DIRECTION_L2R()                  \
  do {                                          \
    ENCODE_CONTROL_SEQUENCE_INTRODUCER;         \
    EMIT_TWO_ASCII_BYTES ('0', ']');            \
  } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4379
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4380
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
/* Produce codes for designation and invocation that put the graphic
   planes and registers back into their initial state.

   First, if CODING_ISO_INVOCATION (coding, 0) is not 0, a shift-in is
   produced.  Then each of the four graphic registers that has an
   initial charset (CODING_ISO_INITIAL >= 0) different from its
   current designation gets that initial charset designated again.

   The locals keep the names `reg' and `charset' because they are
   handed to ENCODE_DESIGNATION as macro arguments.  */
#define ENCODE_RESET_PLANE_AND_REGISTER()                               \
  do {                                                                  \
    int reg;                                                            \
    struct charset *charset;                                            \
                                                                        \
    if (CODING_ISO_INVOCATION (coding, 0) != 0)                         \
      ENCODE_SHIFT_IN;                                                  \
                                                                        \
    for (reg = 0; reg < 4; reg++)                                       \
      {                                                                 \
        /* No initial charset for this register: nothing to do.  */    \
        if (CODING_ISO_INITIAL (coding, reg) < 0)                       \
          continue;                                                     \
        /* Already designated to its initial charset.  */              \
        if (CODING_ISO_DESIGNATION (coding, reg)                        \
            == CODING_ISO_INITIAL (coding, reg))                        \
          continue;                                                     \
                                                                        \
        charset = CHARSET_FROM_ID (CODING_ISO_INITIAL (coding, reg));   \
        ENCODE_DESIGNATION (charset, reg, coding);                      \
      }                                                                 \
  } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4399
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4400
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4401 /* Produce designation sequences of charsets in the line started from
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4402 SRC to a place pointed by DST, and return updated DST.
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4403
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4404 If the current block ends before any end-of-line, we may fail to
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
4405 find all the necessary designations. */
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
4406
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4407 static unsigned char *
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
4408 encode_designation_at_bol (struct coding_system *coding, int *charbuf,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
4409 int *charbuf_end, unsigned char *dst)
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4410 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4411 struct charset *charset;
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4412 /* Table of charsets to be designated to each graphic register. */
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4413 int r[4];
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4414 int c, found = 0, reg;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4415 int produced_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4416 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4417 Lisp_Object attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4418 Lisp_Object charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4419
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4420 attrs = CODING_ID_ATTRS (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4421 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4422 if (EQ (charset_list, Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4423 charset_list = Viso_2022_charset_list;
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4424
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4425 for (reg = 0; reg < 4; reg++)
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4426 r[reg] = -1;
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4427
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4428 while (found < 4)
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4429 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4430 int id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4431
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4432 c = *charbuf++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4433 if (c == '\n')
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4434 break;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4435 charset = char_charset (c, charset_list, NULL);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4436 id = CHARSET_ID (charset);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4437 reg = CODING_ISO_REQUEST (coding, id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4438 if (reg >= 0 && r[reg] < 0)
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4439 {
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4440 found++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4441 r[reg] = id;
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4442 }
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4443 }
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4444
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4445 if (found)
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4446 {
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4447 for (reg = 0; reg < 4; reg++)
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4448 if (r[reg] >= 0
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4449 && CODING_ISO_DESIGNATION (coding, reg) != r[reg])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4450 ENCODE_DESIGNATION (CHARSET_FROM_ID (r[reg]), reg, coding);
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4451 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4452
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4453 return dst;
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4454 }
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4455
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4456 /* See the above "GENERAL NOTES on `encode_coding_XXX ()' functions". */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4457
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4458 static int
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
4459 encode_coding_iso_2022 (struct coding_system *coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4460 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4461 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4462 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4463 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4464 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4465 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4466 int safe_room = 16;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4467 int bol_designation
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4468 = (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_DESIGNATE_AT_BOL
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4469 && CODING_ISO_BOL (coding));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4470 int produced_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4471 Lisp_Object attrs, eol_type, charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4472 int ascii_compatible;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4473 int c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4474 int preferred_charset_id = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4475
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4476 CODING_GET_INFO (coding, attrs, charset_list);
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
4477 eol_type = inhibit_eol_conversion ? Qunix : CODING_ID_EOL_TYPE (coding->id);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4478 if (VECTORP (eol_type))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4479 eol_type = Qunix;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4480
88497
d2b9e0d4c2f6 (Fdecode_sjis_char): Fix typo (0x7F->0xFF). Fix the
Kenichi Handa <handa@m17n.org>
parents: 88485
diff changeset
4481 setup_iso_safe_charsets (attrs);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4482 /* Charset list may have been changed. */
90772
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
4483 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
4484 coding->safe_charsets = SDATA (CODING_ATTR_SAFE_CHARSETS (attrs));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4485
110336
3ffb3b102dae coding.c (encode_coding_iso_2022): Do not optimize for ASCII if we may use designation or locking-shift.
Kenichi Handa <handa@m17n.org>
parents: 110334
diff changeset
4486 ascii_compatible
3ffb3b102dae coding.c (encode_coding_iso_2022): Do not optimize for ASCII if we may use designation or locking-shift.
Kenichi Handa <handa@m17n.org>
parents: 110334
diff changeset
4487 = (! NILP (CODING_ATTR_ASCII_COMPAT (attrs))
3ffb3b102dae coding.c (encode_coding_iso_2022): Do not optimize for ASCII if we may use designation or locking-shift.
Kenichi Handa <handa@m17n.org>
parents: 110334
diff changeset
4488 && ! (CODING_ISO_FLAGS (coding) & (CODING_ISO_FLAG_DESIGNATION
3ffb3b102dae coding.c (encode_coding_iso_2022): Do not optimize for ASCII if we may use designation or locking-shift.
Kenichi Handa <handa@m17n.org>
parents: 110334
diff changeset
4489 | CODING_ISO_FLAG_LOCKING_SHIFT)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4490
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4491 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4492 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4493 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4494
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4495 if (bol_designation)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4496 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4497 unsigned char *dst_prev = dst;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4498
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4499 /* We have to produce designation sequences if any now. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4500 dst = encode_designation_at_bol (coding, charbuf, charbuf_end, dst);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4501 bol_designation = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4502 /* We are sure that designation sequences are all ASCII bytes. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4503 produced_chars += dst - dst_prev;
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4504 }
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4505
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4506 c = *charbuf++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4507
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4508 if (c < 0)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4509 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4510 /* Handle an annotation. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4511 switch (*charbuf)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4512 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4513 case CODING_ANNOTATE_COMPOSITION_MASK:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4514 /* Not yet implemented. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4515 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4516 case CODING_ANNOTATE_CHARSET_MASK:
90014
ade0c9a12f99 (encode_coding_iso_2022): Fix handling of charset
Kenichi Handa <handa@m17n.org>
parents: 90011
diff changeset
4517 preferred_charset_id = charbuf[2];
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4518 if (preferred_charset_id >= 0
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4519 && NILP (Fmemq (make_number (preferred_charset_id),
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4520 charset_list)))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4521 preferred_charset_id = -1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4522 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4523 default:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4524 abort ();
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
4525 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4526 charbuf += -c - 1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4527 continue;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4528 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4529
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4530 /* Now encode the character C. */
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4531 if (c < 0x20 || c == 0x7F)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4532 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4533 if (c == '\n'
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4534 || (c == '\r' && EQ (eol_type, Qmac)))
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4535 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4536 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_RESET_AT_EOL)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4537 ENCODE_RESET_PLANE_AND_REGISTER ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4538 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_INIT_AT_BOL)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4539 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4540 int i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4541
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4542 for (i = 0; i < 4; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4543 CODING_ISO_DESIGNATION (coding, i)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4544 = CODING_ISO_INITIAL (coding, i);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4545 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4546 bol_designation
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4547 = CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_DESIGNATE_AT_BOL;
19052
302a7b2a6948 (encode_coding_iso2022): Write out invalid multibyte
Kenichi Handa <handa@m17n.org>
parents: 18910
diff changeset
4548 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4549 else if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_RESET_AT_CNTL)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4550 ENCODE_RESET_PLANE_AND_REGISTER ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4551 EMIT_ONE_ASCII_BYTE (c);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4552 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4553 else if (ASCII_CHAR_P (c))
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4554 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4555 if (ascii_compatible)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4556 EMIT_ONE_ASCII_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4557 else
88681
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4558 {
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4559 struct charset *charset = CHARSET_FROM_ID (charset_ascii);
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4560 ENCODE_ISO_CHARACTER (charset, c);
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4561 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4562 }
88690
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4563 else if (CHAR_BYTE8_P (c))
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4564 {
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4565 c = CHAR_TO_BYTE8 (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4566 EMIT_ONE_BYTE (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4567 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4568 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4569 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4570 struct charset *charset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4571
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4572 if (preferred_charset_id >= 0)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4573 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4574 charset = CHARSET_FROM_ID (preferred_charset_id);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4575 if (! CHAR_CHARSET_P (c, charset))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4576 charset = char_charset (c, charset_list, NULL);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4577 }
42104
d69c2368e549 (DECODE_COMPOSITION_END): Fixed a typo in the last
Sam Steingold <sds@gnu.org>
parents: 42103
diff changeset
4578 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4579 charset = char_charset (c, charset_list, NULL);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4580 if (!charset)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4581 {
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4582 if (coding->mode & CODING_MODE_SAFE_ENCODING)
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4583 {
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4584 c = CODING_INHIBIT_CHARACTER_SUBSTITUTION;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4585 charset = CHARSET_FROM_ID (charset_ascii);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4586 }
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4587 else
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4588 {
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4589 c = coding->default_char;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4590 charset = char_charset (c, charset_list, NULL);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4591 }
19052
302a7b2a6948 (encode_coding_iso2022): Write out invalid multibyte
Kenichi Handa <handa@m17n.org>
parents: 18910
diff changeset
4592 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4593 ENCODE_ISO_CHARACTER (charset, c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4594 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4595 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4596
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4597 if (coding->mode & CODING_MODE_LAST_BLOCK
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4598 && CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_RESET_AT_EOL)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4599 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4600 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4601 ENCODE_RESET_PLANE_AND_REGISTER ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4602 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4603 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4604 CODING_ISO_BOL (coding) = bol_designation;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4605 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4606 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4607 return 0;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4608 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4609
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4610
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4611 /*** 8,9. SJIS and BIG5 handlers ***/
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4612
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4613 /* Although SJIS and BIG5 are not ISO coding systems, they are used
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4614 quite widely. So, for the moment, Emacs supports them in the bare
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4615 C code. But, in the future, they may be supported only by CCL. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4616
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4617 /* SJIS is a coding system encoding three character sets: ASCII, right
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4618 half of JISX0201-Kana, and JISX0208. An ASCII character is encoded
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4619 as is. A character of charset katakana-jisx0201 is encoded by
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4620 "position-code + 0x80". A character of charset japanese-jisx0208
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4621 is encoded in 2 bytes, but the two position-codes are divided and shifted
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4622 so that they fit in the range below.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4623
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4624 --- CODE RANGE of SJIS ---
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4625 (character set) (range)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4626 ASCII 0x00 .. 0x7F
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4627 KATAKANA-JISX0201 0xA0 .. 0xDF
24324
2eec590faf26 (Fdecode_sjis_char, Fencode_sjis_char): Hanlde
Kenichi Handa <handa@m17n.org>
parents: 24316
diff changeset
4628 JISX0208 (1st byte) 0x81 .. 0x9F and 0xE0 .. 0xEF
23564
6eb3e346d1fd (DECODE_CHARACTER_ASCII): Check validity of inserted
Kenichi Handa <handa@m17n.org>
parents: 23542
diff changeset
4629 (2nd byte) 0x40 .. 0x7E and 0x80 .. 0xFC
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4630 -------------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4631
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4632 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4633
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4634 /* BIG5 is a coding system encoding two character sets: ASCII and
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4635 Big5. An ASCII character is encoded as is. Big5 is a two-byte
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4636 character set and is encoded in two bytes.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4637
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4638 --- CODE RANGE of BIG5 ---
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4639 (character set) (range)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4640 ASCII 0x00 .. 0x7F
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4641 Big5 (1st byte) 0xA1 .. 0xFE
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4642 (2nd byte) 0x40 .. 0x7E and 0xA1 .. 0xFE
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4643 --------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4644
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4645 */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4646
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4647 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4648 Check if a text is encoded in SJIS. If it is, return
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4649 CATEGORY_MASK_SJIS, else return 0. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4650
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
4651 static int
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
4652 detect_coding_sjis (struct coding_system *coding,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
4653 struct coding_detection_info *detect_info)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4654 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4655 const unsigned char *src = coding->source, *src_base;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4656 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4657 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4658 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4659 int found = 0;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4660 int c;
103762
e72df94a89ca (detect_coding_sjis): Handle shift_jis-2004 correctly.
Kenichi Handa <handa@m17n.org>
parents: 103655
diff changeset
4661 Lisp_Object attrs, charset_list;
e72df94a89ca (detect_coding_sjis): Handle shift_jis-2004 correctly.
Kenichi Handa <handa@m17n.org>
parents: 103655
diff changeset
4662 int max_first_byte_of_2_byte_code;
e72df94a89ca (detect_coding_sjis): Handle shift_jis-2004 correctly.
Kenichi Handa <handa@m17n.org>
parents: 103655
diff changeset
4663
e72df94a89ca (detect_coding_sjis): Handle shift_jis-2004 correctly.
Kenichi Handa <handa@m17n.org>
parents: 103655
diff changeset
4664 CODING_GET_INFO (coding, attrs, charset_list);
e72df94a89ca (detect_coding_sjis): Handle shift_jis-2004 correctly.
Kenichi Handa <handa@m17n.org>
parents: 103655
diff changeset
4665 max_first_byte_of_2_byte_code
e72df94a89ca (detect_coding_sjis): Handle shift_jis-2004 correctly.
Kenichi Handa <handa@m17n.org>
parents: 103655
diff changeset
4666 = (XINT (Flength (charset_list)) > 3 ? 0xFC : 0xEF);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4667
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4668 detect_info->checked |= CATEGORY_MASK_SJIS;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4669 /* A coding system of this category is always ASCII compatible. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4670 src += coding->head_ascii;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4671
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4672 while (1)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4673 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4674 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4675 ONE_MORE_BYTE (c);
36647
0a75ccbe42b2 (detect_coding_sjis): Do more rigid check.
Kenichi Handa <handa@m17n.org>
parents: 36520
diff changeset
4676 if (c < 0x80)
0a75ccbe42b2 (detect_coding_sjis): Do more rigid check.
Kenichi Handa <handa@m17n.org>
parents: 36520
diff changeset
4677 continue;
103762
e72df94a89ca (detect_coding_sjis): Handle shift_jis-2004 correctly.
Kenichi Handa <handa@m17n.org>
parents: 103655
diff changeset
4678 if ((c >= 0x81 && c <= 0x9F)
e72df94a89ca (detect_coding_sjis): Handle shift_jis-2004 correctly.
Kenichi Handa <handa@m17n.org>
parents: 103655
diff changeset
4679 || (c >= 0xE0 && c <= max_first_byte_of_2_byte_code))
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4680 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4681 ONE_MORE_BYTE (c);
36647
0a75ccbe42b2 (detect_coding_sjis): Do more rigid check.
Kenichi Handa <handa@m17n.org>
parents: 36520
diff changeset
4682 if (c < 0x40 || c == 0x7F || c > 0xFC)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4683 break;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4684 found = CATEGORY_MASK_SJIS;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4685 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4686 else if (c >= 0xA0 && c < 0xE0)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4687 found = CATEGORY_MASK_SJIS;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4688 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4689 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4690 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4691 detect_info->rejected |= CATEGORY_MASK_SJIS;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4692 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4693
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4694 no_more_source:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4695 if (src_base < src && coding->mode & CODING_MODE_LAST_BLOCK)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4696 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4697 detect_info->rejected |= CATEGORY_MASK_SJIS;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4698 return 0;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4699 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4700 detect_info->found |= found;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4701 return 1;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4702 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4703
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4704 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4705 Check if a text is encoded in BIG5. If it is, return
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4706 CATEGORY_MASK_BIG5, else return 0. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4707
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
4708 static int
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
4709 detect_coding_big5 (struct coding_system *coding,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
4710 struct coding_detection_info *detect_info)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4711 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4712 const unsigned char *src = coding->source, *src_base;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4713 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4714 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4715 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4716 int found = 0;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4717 int c;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4718
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4719 detect_info->checked |= CATEGORY_MASK_BIG5;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4720 /* A coding system of this category is always ASCII compatible. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4721 src += coding->head_ascii;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4722
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4723 while (1)
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4724 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4725 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4726 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4727 if (c < 0x80)
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4728 continue;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4729 if (c >= 0xA1)
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4730 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4731 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4732 if (c < 0x40 || (c >= 0x7F && c <= 0xA0))
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4733 return 0;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4734 found = CATEGORY_MASK_BIG5;
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4735 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4736 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4737 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4738 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4739 detect_info->rejected |= CATEGORY_MASK_BIG5;
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4740 return 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4741
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4742 no_more_source:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4743 if (src_base < src && coding->mode & CODING_MODE_LAST_BLOCK)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4744 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4745 detect_info->rejected |= CATEGORY_MASK_BIG5;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4746 return 0;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4747 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4748 detect_info->found |= found;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4749 return 1;
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4750 }
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4751
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4752 /* See the above "GENERAL NOTES on `decode_coding_XXX ()' functions".
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4753 If SJIS_P is 1, decode SJIS text, else decode BIG5 text. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4754
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4755 static void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
4756 decode_coding_sjis (struct coding_system *coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4757 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4758 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4759 const unsigned char *src_end = coding->source + coding->src_bytes;
59168
0345f2b10f1d (decode_coding_XXX, decode_composition_emacs_mule)
Dan Nicolaescu <dann@ics.uci.edu>
parents: 59095
diff changeset
4760 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4761 int *charbuf = coding->charbuf + coding->charbuf_used;
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
4762 /* We may produce one charset annotation in one loop and one more at
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
4763 the end. */
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4764 int *charbuf_end
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
4765 = coding->charbuf + coding->charbuf_size - (MAX_ANNOTATION_LENGTH * 2);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4766 int consumed_chars = 0, consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4767 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4768 struct charset *charset_roman, *charset_kanji, *charset_kana;
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4769 struct charset *charset_kanji2;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4770 Lisp_Object attrs, charset_list, val;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4771 int char_offset = coding->produced_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4772 int last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4773 int last_id = charset_ascii;
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
4774 int eol_crlf =
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
4775 !inhibit_eol_conversion && EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4776 int byte_after_cr = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4777
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4778 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4779
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4780 val = charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4781 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4782 charset_kana = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4783 charset_kanji = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4784 charset_kanji2 = NILP (val) ? NULL : CHARSET_FROM_ID (XINT (XCAR (val)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4785
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4786 while (1)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4787 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4788 int c, c1;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4789 struct charset *charset;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4790
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4791 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4792 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4793
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4794 if (charbuf >= charbuf_end)
100936
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4795 {
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4796 if (byte_after_cr >= 0)
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4797 src_base--;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4798 break;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4799 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4800
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4801 if (byte_after_cr >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4802 c = byte_after_cr, byte_after_cr = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4803 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4804 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4805 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4806 goto invalid_code;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4807 if (c < 0x80)
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4808 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4809 if (eol_crlf && c == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4810 ONE_MORE_BYTE (byte_after_cr);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4811 charset = charset_roman;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4812 }
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4813 else if (c == 0x80 || c == 0xA0)
89730
d8fcefca5cf6 (decode_coding_sjis): Check the first byte rigidly.
Kenichi Handa <handa@m17n.org>
parents: 89686
diff changeset
4814 goto invalid_code;
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4815 else if (c >= 0xA1 && c <= 0xDF)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4816 {
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4817 /* SJIS -> JISX0201-Kana */
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4818 c &= 0x7F;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4819 charset = charset_kana;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4820 }
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4821 else if (c <= 0xEF)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4822 {
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4823 /* SJIS -> JISX0208 */
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4824 ONE_MORE_BYTE (c1);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4825 if (c1 < 0x40 || c1 == 0x7F || c1 > 0xFC)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4826 goto invalid_code;
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4827 c = (c << 8) | c1;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4828 SJIS_TO_JIS (c);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4829 charset = charset_kanji;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4830 }
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4831 else if (c <= 0xFC && charset_kanji2)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4832 {
89779
74c503490829 (decode_coding_sjis): Fix comment.
Kenichi Handa <handa@m17n.org>
parents: 89764
diff changeset
4833 /* SJIS -> JISX0213-2 */
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4834 ONE_MORE_BYTE (c1);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4835 if (c1 < 0x40 || c1 == 0x7F || c1 > 0xFC)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4836 goto invalid_code;
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4837 c = (c << 8) | c1;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4838 SJIS_TO_JIS2 (c);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4839 charset = charset_kanji2;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4840 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4841 else
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4842 goto invalid_code;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4843 if (charset->id != charset_ascii
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4844 && last_id != charset->id)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4845 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4846 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4847 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4848 last_id = charset->id;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4849 last_offset = char_offset;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4850 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4851 CODING_DECODE_CHAR (coding, src, src_base, src_end, charset, c, c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4852 *charbuf++ = c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4853 char_offset++;
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
4854 continue;
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
4855
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4856 invalid_code:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4857 src = src_base;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4858 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4859 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4860 *charbuf++ = c < 0 ? -c : BYTE8_TO_CHAR (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4861 char_offset++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4862 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4863 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4864
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4865 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4866 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4867 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4868 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4869 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4870 coding->charbuf_used = charbuf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4871 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4872
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4873 static void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
4874 decode_coding_big5 (struct coding_system *coding)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4875 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4876 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4877 const unsigned char *src_end = coding->source + coding->src_bytes;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4878 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4879 int *charbuf = coding->charbuf + coding->charbuf_used;
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
4880 /* We may produce one charset annotation in one loop and one more at
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
4881 the end. */
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4882 int *charbuf_end
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
4883 = coding->charbuf + coding->charbuf_size - (MAX_ANNOTATION_LENGTH * 2);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4884 int consumed_chars = 0, consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4885 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4886 struct charset *charset_roman, *charset_big5;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4887 Lisp_Object attrs, charset_list, val;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4888 int char_offset = coding->produced_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4889 int last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4890 int last_id = charset_ascii;
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
4891 int eol_crlf =
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
4892 !inhibit_eol_conversion && EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4893 int byte_after_cr = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4894
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4895 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4896 val = charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4897 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4898 charset_big5 = CHARSET_FROM_ID (XINT (XCAR (val)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4899
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4900 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4901 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4902 int c, c1;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4903 struct charset *charset;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4904
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4905 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4906 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4907
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4908 if (charbuf >= charbuf_end)
100936
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4909 {
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4910 if (byte_after_cr >= 0)
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4911 src_base--;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4912 break;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4913 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4914
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4915 if (byte_after_cr >= 0)
92406
c36bda0a03cc (decode_coding_big5, produce_chars): Fix typos in last
Andreas Schwab <schwab@suse.de>
parents: 92399
diff changeset
4916 c = byte_after_cr, byte_after_cr = -1;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4917 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4918 ONE_MORE_BYTE (c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4919
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4920 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4921 goto invalid_code;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4922 if (c < 0x80)
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4923 {
92406
c36bda0a03cc (decode_coding_big5, produce_chars): Fix typos in last
Andreas Schwab <schwab@suse.de>
parents: 92399
diff changeset
4924 if (eol_crlf && c == '\r')
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4925 ONE_MORE_BYTE (byte_after_cr);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4926 charset = charset_roman;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4927 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4928 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4929 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4930 /* BIG5 -> Big5 */
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4931 if (c < 0xA1 || c > 0xFE)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4932 goto invalid_code;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4933 ONE_MORE_BYTE (c1);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4934 if (c1 < 0x40 || (c1 > 0x7E && c1 < 0xA1) || c1 > 0xFE)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4935 goto invalid_code;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4936 c = c << 8 | c1;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4937 charset = charset_big5;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4938 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4939 if (charset->id != charset_ascii
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4940 && last_id != charset->id)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4941 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4942 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4943 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4944 last_id = charset->id;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4945 last_offset = char_offset;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4946 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4947 CODING_DECODE_CHAR (coding, src, src_base, src_end, charset, c, c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4948 *charbuf++ = c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4949 char_offset++;
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
4950 continue;
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
4951
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4952 invalid_code:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4953 src = src_base;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4954 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4955 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4956 *charbuf++ = c < 0 ? -c : BYTE8_TO_CHAR (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4957 char_offset++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4958 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4959 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4960
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4961 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4962 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4963 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4964 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4965 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4966 coding->charbuf_used = charbuf - coding->charbuf;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4967 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4968
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4969 /* See the above "GENERAL NOTES on `encode_coding_XXX ()' functions".
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4970 This function can encode charsets `ascii', `katakana-jisx0201',
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4971 `japanese-jisx0208', `chinese-big5-1', and `chinese-big5-2'. We
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4972 are sure that all these charsets are registered as official charset
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4973 (i.e. do not have extended leading-codes). Characters of other
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4974 charsets are produced without any encoding. If SJIS_P is 1, encode
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4975 SJIS text, else encode BIG5 text. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4976
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4977 static int
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
4978 encode_coding_sjis (struct coding_system *coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4979 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4980 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4981 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4982 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4983 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4984 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4985 int safe_room = 4;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4986 int produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4987 Lisp_Object attrs, charset_list, val;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4988 int ascii_compatible;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4989 struct charset *charset_roman, *charset_kanji, *charset_kana;
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4990 struct charset *charset_kanji2;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4991 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4992
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4993 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4994 val = charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4995 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4996 charset_kana = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4997 charset_kanji = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4998 charset_kanji2 = NILP (val) ? NULL : CHARSET_FROM_ID (XINT (XCAR (val)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4999
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5000 ascii_compatible = ! NILP (CODING_ATTR_ASCII_COMPAT (attrs));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5001
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5002 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5003 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5004 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5005 c = *charbuf++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5006 /* Now encode the character C. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5007 if (ASCII_CHAR_P (c) && ascii_compatible)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5008 EMIT_ONE_ASCII_BYTE (c);
88690
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5009 else if (CHAR_BYTE8_P (c))
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5010 {
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5011 c = CHAR_TO_BYTE8 (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5012 EMIT_ONE_BYTE (c);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5013 }
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5014 else
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5015 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5016 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5017 struct charset *charset = char_charset (c, charset_list, &code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5018
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5019 if (!charset)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5020 {
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5021 if (coding->mode & CODING_MODE_SAFE_ENCODING)
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5022 {
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5023 code = CODING_INHIBIT_CHARACTER_SUBSTITUTION;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5024 charset = CHARSET_FROM_ID (charset_ascii);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5025 }
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5026 else
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5027 {
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5028 c = coding->default_char;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5029 charset = char_charset (c, charset_list, &code);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5030 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5031 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5032 if (code == CHARSET_INVALID_CODE (charset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5033 abort ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5034 if (charset == charset_kanji)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5035 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5036 int c1, c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5037 JIS_TO_SJIS (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5038 c1 = code >> 8, c2 = code & 0xFF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5039 EMIT_TWO_BYTES (c1, c2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5040 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5041 else if (charset == charset_kana)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5042 EMIT_ONE_BYTE (code | 0x80);
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5043 else if (charset_kanji2 && charset == charset_kanji2)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5044 {
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5045 int c1, c2;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5046
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5047 c1 = code >> 8;
103762
e72df94a89ca (detect_coding_sjis): Handle shift_jis-2004 correctly.
Kenichi Handa <handa@m17n.org>
parents: 103655
diff changeset
5048 if (c1 == 0x21 || (c1 >= 0x23 && c1 <= 0x25)
e72df94a89ca (detect_coding_sjis): Handle shift_jis-2004 correctly.
Kenichi Handa <handa@m17n.org>
parents: 103655
diff changeset
5049 || c1 == 0x28
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5050 || (c1 >= 0x2C && c1 <= 0x2F) || c1 >= 0x6E)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5051 {
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5052 JIS_TO_SJIS2 (code);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5053 c1 = code >> 8, c2 = code & 0xFF;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5054 EMIT_TWO_BYTES (c1, c2);
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5055 }
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5056 else
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5057 EMIT_ONE_ASCII_BYTE (code & 0x7F);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5058 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5059 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5060 EMIT_ONE_ASCII_BYTE (code & 0x7F);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5061 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5062 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5063 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5064 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5065 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5066 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5067 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5068
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5069 static int
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
5070 encode_coding_big5 (struct coding_system *coding)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5071 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5072 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5073 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5074 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5075 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5076 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5077 int safe_room = 4;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5078 int produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5079 Lisp_Object attrs, charset_list, val;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5080 int ascii_compatible;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5081 struct charset *charset_roman, *charset_big5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5082 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5083
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5084 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5085 val = charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5086 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5087 charset_big5 = CHARSET_FROM_ID (XINT (XCAR (val)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5088 ascii_compatible = ! NILP (CODING_ATTR_ASCII_COMPAT (attrs));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5089
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5090 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5091 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5092 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5093 c = *charbuf++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5094 /* Now encode the character C. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5095 if (ASCII_CHAR_P (c) && ascii_compatible)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5096 EMIT_ONE_ASCII_BYTE (c);
88690
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5097 else if (CHAR_BYTE8_P (c))
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5098 {
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5099 c = CHAR_TO_BYTE8 (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5100 EMIT_ONE_BYTE (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5101 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5102 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5103 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5104 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5105 struct charset *charset = char_charset (c, charset_list, &code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5106
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5107 if (! charset)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5108 {
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5109 if (coding->mode & CODING_MODE_SAFE_ENCODING)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5110 {
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5111 code = CODING_INHIBIT_CHARACTER_SUBSTITUTION;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5112 charset = CHARSET_FROM_ID (charset_ascii);
51140
94d903190cee (ENCODE_UNSAFE_CHARACTER): Adjusted for the name change
Kenichi Handa <handa@m17n.org>
parents: 51090
diff changeset
5113 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5114 else
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5115 {
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5116 c = coding->default_char;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5117 charset = char_charset (c, charset_list, &code);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5118 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5119 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5120 if (code == CHARSET_INVALID_CODE (charset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5121 abort ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5122 if (charset == charset_big5)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5123 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5124 int c1, c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5125
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5126 c1 = code >> 8, c2 = code & 0xFF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5127 EMIT_TWO_BYTES (c1, c2);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5128 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5129 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5130 EMIT_ONE_ASCII_BYTE (code & 0x7F);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5131 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5132 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5133 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5134 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5135 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5136 return 0;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5137 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5138
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5139
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5140 /*** 10. CCL handlers ***/
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5141
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5142 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5143 Check if a text is encoded in a coding system of which
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5144 encoder/decoder are written in CCL program. If it is, return
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5145 CATEGORY_MASK_CCL, else return 0. */
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5146
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
5147 static int
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
5148 detect_coding_ccl (struct coding_system *coding,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
5149 struct coding_detection_info *detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5150 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5151 const unsigned char *src = coding->source, *src_base;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5152 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5153 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5154 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5155 int found = 0;
89848
3edfa038a435 (detect_coding_emacs_mule): Fix counting of encoded
Kenichi Handa <handa@m17n.org>
parents: 89842
diff changeset
5156 unsigned char *valids;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5157 int head_ascii = coding->head_ascii;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5158 Lisp_Object attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5159
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5160 detect_info->checked |= CATEGORY_MASK_CCL;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5161
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5162 coding = &coding_categories[coding_category_ccl];
89848
3edfa038a435 (detect_coding_emacs_mule): Fix counting of encoded
Kenichi Handa <handa@m17n.org>
parents: 89842
diff changeset
5163 valids = CODING_CCL_VALIDS (coding);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5164 attrs = CODING_ID_ATTRS (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5165 if (! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5166 src += head_ascii;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5167
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5168 while (1)
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5169 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5170 int c;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5171
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5172 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5173 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5174 if (c < 0 || ! valids[c])
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5175 break;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5176 if ((valids[c] > 1))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5177 found = CATEGORY_MASK_CCL;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5178 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5179 detect_info->rejected |= CATEGORY_MASK_CCL;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5180 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5181
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5182 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5183 detect_info->found |= found;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5184 return 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5185 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5186
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5187 static void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
5188 decode_coding_ccl (struct coding_system *coding)
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5189 {
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
5190 const unsigned char *src = coding->source + coding->consumed;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5191 const unsigned char *src_end = coding->source + coding->src_bytes;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5192 int *charbuf = coding->charbuf + coding->charbuf_used;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5193 int *charbuf_end = coding->charbuf + coding->charbuf_size;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5194 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5195 int multibytep = coding->src_multibyte;
107171
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
5196 struct ccl_program *ccl = &coding->spec.ccl->ccl;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5197 int source_charbuf[1024];
107506
cd151730b160 coding.c (decode_coding_ccl): Fix previous change for the multibyte case.
Kenichi Handa <handa@m17n.org>
parents: 107323
diff changeset
5198 int source_byteidx[1025];
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5199 Lisp_Object attrs, charset_list;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5200
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5201 CODING_GET_INFO (coding, attrs, charset_list);
107171
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
5202
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
5203 while (1)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5204 {
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
5205 const unsigned char *p = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5206 int i = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5207
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5208 if (multibytep)
107506
cd151730b160 coding.c (decode_coding_ccl): Fix previous change for the multibyte case.
Kenichi Handa <handa@m17n.org>
parents: 107323
diff changeset
5209 {
cd151730b160 coding.c (decode_coding_ccl): Fix previous change for the multibyte case.
Kenichi Handa <handa@m17n.org>
parents: 107323
diff changeset
5210 while (i < 1024 && p < src_end)
cd151730b160 coding.c (decode_coding_ccl): Fix previous change for the multibyte case.
Kenichi Handa <handa@m17n.org>
parents: 107323
diff changeset
5211 {
cd151730b160 coding.c (decode_coding_ccl): Fix previous change for the multibyte case.
Kenichi Handa <handa@m17n.org>
parents: 107323
diff changeset
5212 source_byteidx[i] = p - src;
cd151730b160 coding.c (decode_coding_ccl): Fix previous change for the multibyte case.
Kenichi Handa <handa@m17n.org>
parents: 107323
diff changeset
5213 source_charbuf[i++] = STRING_CHAR_ADVANCE (p);
cd151730b160 coding.c (decode_coding_ccl): Fix previous change for the multibyte case.
Kenichi Handa <handa@m17n.org>
parents: 107323
diff changeset
5214 }
cd151730b160 coding.c (decode_coding_ccl): Fix previous change for the multibyte case.
Kenichi Handa <handa@m17n.org>
parents: 107323
diff changeset
5215 source_byteidx[i] = p - src;
cd151730b160 coding.c (decode_coding_ccl): Fix previous change for the multibyte case.
Kenichi Handa <handa@m17n.org>
parents: 107323
diff changeset
5216 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5217 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5218 while (i < 1024 && p < src_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5219 source_charbuf[i++] = *p++;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5220
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5221 if (p == src_end && coding->mode & CODING_MODE_LAST_BLOCK)
107171
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
5222 ccl->last_block = 1;
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
5223 ccl_driver (ccl, source_charbuf, charbuf, i, charbuf_end - charbuf,
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
5224 charset_list);
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
5225 charbuf += ccl->produced;
107506
cd151730b160 coding.c (decode_coding_ccl): Fix previous change for the multibyte case.
Kenichi Handa <handa@m17n.org>
parents: 107323
diff changeset
5226 if (multibytep)
107171
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
5227 src += source_byteidx[ccl->consumed];
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5228 else
107171
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
5229 src += ccl->consumed;
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
5230 consumed_chars += ccl->consumed;
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
5231 if (p == src_end || ccl->status != CCL_STAT_SUSPEND_BY_SRC)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5232 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5233 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5234
107171
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
5235 switch (ccl->status)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5236 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5237 case CCL_STAT_SUSPEND_BY_SRC:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5238 record_conversion_result (coding, CODING_RESULT_INSUFFICIENT_SRC);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5239 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5240 case CCL_STAT_SUSPEND_BY_DST:
107171
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
5241 record_conversion_result (coding, CODING_RESULT_INSUFFICIENT_DST);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5242 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5243 case CCL_STAT_QUIT:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5244 case CCL_STAT_INVALID_CMD:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5245 record_conversion_result (coding, CODING_RESULT_INTERRUPT);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5246 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5247 default:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5248 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5249 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5250 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5251 coding->consumed_char += consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5252 coding->consumed = src - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5253 coding->charbuf_used = charbuf - coding->charbuf;
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5254 }
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5255
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5256 static int
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
5257 encode_coding_ccl (struct coding_system *coding)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5258 {
107507
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
5259 struct ccl_program *ccl = &coding->spec.ccl->ccl;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5260 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5261 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5262 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5263 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5264 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5265 int destination_charbuf[1024];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5266 int i, produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5267 Lisp_Object attrs, charset_list;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5268
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5269 CODING_GET_INFO (coding, attrs, charset_list);
107507
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
5270 if (coding->consumed_char == coding->src_chars
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
5271 && coding->mode & CODING_MODE_LAST_BLOCK)
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
5272 ccl->last_block = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5273
90346
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5274 while (charbuf < charbuf_end)
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5275 {
107507
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
5276 ccl_driver (ccl, charbuf, destination_charbuf,
90346
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5277 charbuf_end - charbuf, 1024, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5278 if (multibytep)
90346
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5279 {
107507
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
5280 ASSURE_DESTINATION (ccl->produced * 2);
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
5281 for (i = 0; i < ccl->produced; i++)
90346
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5282 EMIT_ONE_BYTE (destination_charbuf[i] & 0xFF);
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5283 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5284 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5285 {
107507
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
5286 ASSURE_DESTINATION (ccl->produced);
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
5287 for (i = 0; i < ccl->produced; i++)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5288 *dst++ = destination_charbuf[i] & 0xFF;
107507
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
5289 produced_chars += ccl->produced;
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
5290 }
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
5291 charbuf += ccl->consumed;
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
5292 if (ccl->status == CCL_STAT_QUIT
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
5293 || ccl->status == CCL_STAT_INVALID_CMD)
90346
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5294 break;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5295 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5296
107507
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
5297 switch (ccl->status)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5298 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5299 case CCL_STAT_SUSPEND_BY_SRC:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5300 record_conversion_result (coding, CODING_RESULT_INSUFFICIENT_SRC);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5301 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5302 case CCL_STAT_SUSPEND_BY_DST:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5303 record_conversion_result (coding, CODING_RESULT_INSUFFICIENT_DST);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5304 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5305 case CCL_STAT_QUIT:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5306 case CCL_STAT_INVALID_CMD:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5307 record_conversion_result (coding, CODING_RESULT_INTERRUPT);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5308 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5309 default:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5310 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5311 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5312 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5313
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5314 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5315 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5316 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5317 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5318
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5319
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5320
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5321 /*** 10, 11. no-conversion handlers ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5322
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5323 /* See the above "GENERAL NOTES on `decode_coding_XXX ()' functions". */
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5324
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5325 static void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
5326 decode_coding_raw_text (struct coding_system *coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5327 {
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
5328 int eol_crlf =
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
5329 !inhibit_eol_conversion && EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5330
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5331 coding->chars_at_source = 1;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5332 coding->consumed_char = coding->src_chars;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5333 coding->consumed = coding->src_bytes;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5334 if (eol_crlf && coding->source[coding->src_bytes - 1] == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5335 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5336 coding->consumed_char--;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5337 coding->consumed--;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5338 record_conversion_result (coding, CODING_RESULT_INSUFFICIENT_SRC);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5339 }
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5340 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5341 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5342 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5343
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5344 static int
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
5345 encode_coding_raw_text (struct coding_system *coding)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5346 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5347 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5348 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5349 int *charbuf_end = coding->charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5350 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5351 unsigned char *dst_end = coding->destination + coding->dst_bytes;
95345
0350e5efb8f7 (encode_coding_raw_text): Fix last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 95344
diff changeset
5352 int produced_chars = 0;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5353 int c;
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5354
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5355 if (multibytep)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5356 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5357 int safe_room = MAX_MULTIBYTE_LENGTH * 2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5358
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5359 if (coding->src_multibyte)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5360 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5361 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5362 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5363 c = *charbuf++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5364 if (ASCII_CHAR_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5365 EMIT_ONE_ASCII_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5366 else if (CHAR_BYTE8_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5367 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5368 c = CHAR_TO_BYTE8 (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5369 EMIT_ONE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5370 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5371 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5372 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5373 unsigned char str[MAX_MULTIBYTE_LENGTH], *p0 = str, *p1 = str;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5374
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5375 CHAR_STRING_ADVANCE (c, p1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5376 while (p0 < p1)
88950
ad258ee59fbb * coding.c (make_conversion_work_buffer): Adjusted for the change
Kenichi Handa <handa@m17n.org>
parents: 88936
diff changeset
5377 {
ad258ee59fbb * coding.c (make_conversion_work_buffer): Adjusted for the change
Kenichi Handa <handa@m17n.org>
parents: 88936
diff changeset
5378 EMIT_ONE_BYTE (*p0);
ad258ee59fbb * coding.c (make_conversion_work_buffer): Adjusted for the change
Kenichi Handa <handa@m17n.org>
parents: 88936
diff changeset
5379 p0++;
ad258ee59fbb * coding.c (make_conversion_work_buffer): Adjusted for the change
Kenichi Handa <handa@m17n.org>
parents: 88936
diff changeset
5380 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5381 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5382 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5383 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5384 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5385 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5386 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5387 c = *charbuf++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5388 EMIT_ONE_BYTE (c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5389 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5390 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5391 else
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5392 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5393 if (coding->src_multibyte)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5394 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5395 int safe_room = MAX_MULTIBYTE_LENGTH;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5396
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5397 while (charbuf < charbuf_end)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5398 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5399 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5400 c = *charbuf++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5401 if (ASCII_CHAR_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5402 *dst++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5403 else if (CHAR_BYTE8_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5404 *dst++ = CHAR_TO_BYTE8 (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5405 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5406 CHAR_STRING_ADVANCE (c, dst);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5407 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5408 }
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
5409 else
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5410 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5411 ASSURE_DESTINATION (charbuf_end - charbuf);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5412 while (charbuf < charbuf_end && dst < dst_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5413 *dst++ = *charbuf++;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5414 }
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
5415 produced_chars = dst - (coding->destination + coding->produced);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5416 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5417 record_conversion_result (coding, CODING_RESULT_SUCCESS);
95345
0350e5efb8f7 (encode_coding_raw_text): Fix last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 95344
diff changeset
5418 coding->produced_char += produced_chars;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5419 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5420 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5421 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5422
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5423 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5424 Check if a text is encoded in a charset-based coding system. If it
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5425 is, return 1, else return 0. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5426
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5427 static int
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
5428 detect_coding_charset (struct coding_system *coding,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
5429 struct coding_detection_info *detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5430 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5431 const unsigned char *src = coding->source, *src_base;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5432 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5433 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5434 int consumed_chars = 0;
98951
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5435 Lisp_Object attrs, valids, name;
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
5436 int found = 0;
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5437 int head_ascii = coding->head_ascii;
98951
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5438 int check_latin_extra = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5439
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5440 detect_info->checked |= CATEGORY_MASK_CHARSET;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5441
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5442 coding = &coding_categories[coding_category_charset];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5443 attrs = CODING_ID_ATTRS (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5444 valids = AREF (attrs, coding_attr_charset_valids);
98951
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5445 name = CODING_ID_NAME (coding->id);
102327
a1f0d8fadbb1 (detect_coding_charset): Fix last change for non-latin charsets.
Jason Rumney <jasonr@gnu.org>
parents: 102325
diff changeset
5446 if (strncmp ((char *) SDATA (SYMBOL_NAME (name)),
a1f0d8fadbb1 (detect_coding_charset): Fix last change for non-latin charsets.
Jason Rumney <jasonr@gnu.org>
parents: 102325
diff changeset
5447 "iso-8859-", sizeof ("iso-8859-") - 1) == 0
a1f0d8fadbb1 (detect_coding_charset): Fix last change for non-latin charsets.
Jason Rumney <jasonr@gnu.org>
parents: 102325
diff changeset
5448 || strncmp ((char *) SDATA (SYMBOL_NAME (name)),
a1f0d8fadbb1 (detect_coding_charset): Fix last change for non-latin charsets.
Jason Rumney <jasonr@gnu.org>
parents: 102325
diff changeset
5449 "iso-latin-", sizeof ("iso-latin-") - 1) == 0)
98951
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5450 check_latin_extra = 1;
102327
a1f0d8fadbb1 (detect_coding_charset): Fix last change for non-latin charsets.
Jason Rumney <jasonr@gnu.org>
parents: 102325
diff changeset
5451
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5452 if (! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5453 src += head_ascii;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5454
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5455 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5456 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5457 int c;
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5458 Lisp_Object val;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5459 struct charset *charset;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5460 int dim, idx;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5461
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5462 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5463 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5464 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5465 continue;
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5466 val = AREF (valids, c);
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5467 if (NILP (val))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5468 break;
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
5469 if (c >= 0x80)
98951
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5470 {
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5471 if (c < 0xA0
102327
a1f0d8fadbb1 (detect_coding_charset): Fix last change for non-latin charsets.
Jason Rumney <jasonr@gnu.org>
parents: 102325
diff changeset
5472 && check_latin_extra
a1f0d8fadbb1 (detect_coding_charset): Fix last change for non-latin charsets.
Jason Rumney <jasonr@gnu.org>
parents: 102325
diff changeset
5473 && (!VECTORP (Vlatin_extra_code_table)
102325
2c693a021d83 (detect_coding_charset): If not checking latin extra,
Jason Rumney <jasonr@gnu.org>
parents: 102320
diff changeset
5474 || NILP (XVECTOR (Vlatin_extra_code_table)->contents[c])))
98951
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5475 break;
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5476 found = CATEGORY_MASK_CHARSET;
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5477 }
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5478 if (INTEGERP (val))
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5479 {
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5480 charset = CHARSET_FROM_ID (XFASTINT (val));
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5481 dim = CHARSET_DIMENSION (charset);
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5482 for (idx = 1; idx < dim; idx++)
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
5483 {
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5484 if (src == src_end)
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5485 goto too_short;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5486 ONE_MORE_BYTE (c);
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
5487 if (c < charset->code_space[(dim - 1 - idx) * 2]
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5488 || c > charset->code_space[(dim - 1 - idx) * 2 + 1])
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5489 break;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5490 }
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5491 if (idx < dim)
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5492 break;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5493 }
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5494 else
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5495 {
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5496 idx = 1;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5497 for (; CONSP (val); val = XCDR (val))
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5498 {
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5499 charset = CHARSET_FROM_ID (XFASTINT (XCAR (val)));
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5500 dim = CHARSET_DIMENSION (charset);
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5501 while (idx < dim)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5502 {
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5503 if (src == src_end)
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5504 goto too_short;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5505 ONE_MORE_BYTE (c);
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5506 if (c < charset->code_space[(dim - 1 - idx) * 4]
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5507 || c > charset->code_space[(dim - 1 - idx) * 4 + 1])
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5508 break;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5509 idx++;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5510 }
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5511 if (idx == dim)
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5512 {
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5513 val = Qnil;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5514 break;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5515 }
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
5516 }
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5517 if (CONSP (val))
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5518 break;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5519 }
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5520 }
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5521 too_short:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5522 detect_info->rejected |= CATEGORY_MASK_CHARSET;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5523 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5524
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5525 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5526 detect_info->found |= found;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5527 return 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5528 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5529
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
/* Decode the bytes of CODING->source, starting at offset CODING->consumed,
   into character codes appended to CODING->charbuf.  The charset used for
   each leading byte is looked up in the table stored in the
   coding_attr_charset_valids slot of the coding system attributes.  A byte
   that cannot be decoded goes through the invalid_code path and is counted
   in CODING->errors.  On exit CODING->consumed_char, CODING->consumed and
   CODING->charbuf_used are updated.
   NOTE(review): ONE_MORE_BYTE, CODING_DECODE_CHAR, ADD_CHARSET_DATA and
   CODING_GET_INFO are macros defined outside this view.  ONE_MORE_BYTE
   presumably uses consumed_chars and multibytep and jumps to
   no_more_source when the source is exhausted -- confirm against their
   definitions.  */
5530 static void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
5531 decode_coding_charset (struct coding_system *coding)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5532 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5533 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5534 const unsigned char *src_end = coding->source + coding->src_bytes;
46548
cb1914307488 (encode_eol, detect_coding, detect_eol):
Ken Raeburn <raeburn@raeburn.org>
parents: 46462
diff changeset
5535 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5536 int *charbuf = coding->charbuf + coding->charbuf_used;
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
5537 /* We may produce one charset annotation in one loop and one more at
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
5538 the end. */
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5539 int *charbuf_end
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
5540 = coding->charbuf + coding->charbuf_size - (MAX_ANNOTATION_LENGTH * 2);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* consumed_chars and multibytep are not referenced by name in the visible
   statements below except for the save/restore of consumed_chars;
   presumably ONE_MORE_BYTE reads and updates them -- confirm.  */
5541 int consumed_chars = 0, consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5542 int multibytep = coding->src_multibyte;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5543 Lisp_Object attrs, charset_list, valids;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
/* char_offset counts characters produced so far; last_offset and last_id
   record where the current run of a single charset began and which
   charset it is.  */
5544 int char_offset = coding->produced_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5545 int last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5546 int last_id = charset_ascii;
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
/* Nonzero when the '\r' look-ahead below is enabled: EOL conversion is
   not inhibited and the EOL type of the coding system is Qdos.  */
5547 int eol_crlf =
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
5548 !inhibit_eol_conversion && EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
/* The byte read ahead after a '\r' when eol_crlf is set, or -1 when no
   such byte is pending.  */
5549 int byte_after_cr = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5550
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5551 CODING_GET_INFO (coding, attrs, charset_list);
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5552 valids = AREF (attrs, coding_attr_charset_valids);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5553
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5554 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5555 {
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5556 int c;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5557 Lisp_Object val;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5558 struct charset *charset;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5559 int dim;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
/* Number of bytes already folded into CODE for the current character.  */
5560 int len = 1;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5561 unsigned code;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5562
29093
176708661b08 (encode_eol): Fix a bug of DOS style EOL encoding.
Kenichi Handa <handa@m17n.org>
parents: 29005
diff changeset
/* Remember where this character starts so that invalid_code can rewind
   and so that the final consumed counts exclude a partial character.  */
5563 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5564 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5565
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Stop once charbuf has reached charbuf_end, which already leaves room
   for two annotations.  */
5566 if (charbuf >= charbuf_end)
100936
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
5567 {
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
/* A look-ahead byte is still pending: back src_base up by one so that
   the consumed count computed after the loop does not include it.  */
5568 if (byte_after_cr >= 0)
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
5569 src_base--;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
5570 break;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
5571 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5572
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
/* Use the pending look-ahead byte, if any, before reading a new one.  */
5573 if (byte_after_cr >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5574 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5575 c = byte_after_cr;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5576 byte_after_cr = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5577 }
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5578 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5579 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5580 ONE_MORE_BYTE (c);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
/* With DOS EOL handling enabled, read the byte after a '\r' right away
   and keep it in byte_after_cr for the next iteration.  */
5581 if (eol_crlf && c == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5582 ONE_MORE_BYTE (byte_after_cr);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5583 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5584 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5585 goto invalid_code;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5586 code = c;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5587
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
/* Look up the leading byte.  Only an integer (a single charset ID) or a
   cons (a list of charset IDs) is accepted; anything else is invalid.  */
5588 val = AREF (valids, c);
100170
86455974b971 (decode_coding_charset): Check type of an element of
Kenichi Handa <handa@m17n.org>
parents: 100135
diff changeset
5589 if (! INTEGERP (val) && ! CONSP (val))
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5590 goto invalid_code;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5591 if (INTEGERP (val))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5592 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5593 charset = CHARSET_FROM_ID (XFASTINT (val));
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5594 dim = CHARSET_DIMENSION (charset);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
/* Read the remaining bytes of the code, shifting earlier bytes toward
   the more significant end of CODE.  */
5595 while (len < dim)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5596 {
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5597 ONE_MORE_BYTE (c);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5598 code = (code << 8) | c;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5599 len++;
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
5600 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5601 CODING_DECODE_CHAR (coding, src, src_base, src_end,
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5602 charset, code, c);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5603 }
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
5604 else
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5605 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5606 /* VAL is a list of charset IDs. It is assured that the
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5607 list is sorted by charset dimensions (smaller one
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5608 comes first). */
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5609 while (CONSP (val))
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5610 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5611 charset = CHARSET_FROM_ID (XFASTINT (XCAR (val)));
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
5612 dim = CHARSET_DIMENSION (charset);
88607
18436bf3d6dd (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88598
diff changeset
/* LEN and CODE carry over between candidates, so only the extra bytes a
   higher-dimension charset needs are read here.  */
5613 while (len < dim)
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5614 {
88598
b88195f69856 (decode_coding_charset): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88597
diff changeset
5615 ONE_MORE_BYTE (c);
b88195f69856 (decode_coding_charset): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88597
diff changeset
5616 code = (code << 8) | c;
88607
18436bf3d6dd (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88598
diff changeset
5617 len++;
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5618 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5619 CODING_DECODE_CHAR (coding, src, src_base,
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5620 src_end, charset, code, c);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
/* The first charset in the list that yields a non-negative character is
   used; otherwise move on to the next candidate.  */
5621 if (c >= 0)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5622 break;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5623 val = XCDR (val);
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5624 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5625 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5626 if (c < 0)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5627 goto invalid_code;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
/* On a switch to a different non-ASCII charset, pass the previous run
   (if it was non-ASCII) to ADD_CHARSET_DATA and start tracking a new
   run from the current character offset.  */
5628 if (charset->id != charset_ascii
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5629 && last_id != charset->id)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5630 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5631 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5632 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5633 last_id = charset->id;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5634 last_offset = char_offset;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5635 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5636
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5637 *charbuf++ = c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5638 char_offset++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5639 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5640
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Rewind to the start of this character, re-read a single byte and store
   it as -c when negative, as itself when ASCII_BYTE_P holds, otherwise as
   BYTE8_TO_CHAR (c); the error counter is incremented.  */
5641 invalid_code:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5642 src = src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5643 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5644 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5645 *charbuf++ = c < 0 ? -c : ASCII_BYTE_P (c) ? c : BYTE8_TO_CHAR (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5646 char_offset++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5647 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5648 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5649
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Reached when the loop breaks on a full charbuf.  No visible goto
   targets this label; presumably ONE_MORE_BYTE jumps here when the
   source runs out -- confirm against its definition.  */
5650 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5651 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5652 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Progress is reported from the values saved at the start of the latest
   loop iteration (consumed_chars_base, src_base), not from the live
   consumed_chars / src.  */
5653 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5654 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5655 coding->charbuf_used = charbuf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5656 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5657
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5658 static int
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
5659 encode_coding_charset (struct coding_system *coding)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5660 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5661 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5662 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5663 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5664 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5665 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5666 int safe_room = MAX_MULTIBYTE_LENGTH;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5667 int produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5668 Lisp_Object attrs, charset_list;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5669 int ascii_compatible;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5670 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5671
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5672 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5673 ascii_compatible = ! NILP (CODING_ATTR_ASCII_COMPAT (attrs));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5674
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5675 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5676 {
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5677 struct charset *charset;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5678 unsigned code;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5679
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5680 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5681 c = *charbuf++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5682 if (ascii_compatible && ASCII_CHAR_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5683 EMIT_ONE_ASCII_BYTE (c);
88690
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5684 else if (CHAR_BYTE8_P (c))
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5685 {
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5686 c = CHAR_TO_BYTE8 (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5687 EMIT_ONE_BYTE (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5688 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5689 else
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5690 {
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5691 charset = char_charset (c, charset_list, &code);
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5692 if (charset)
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5693 {
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5694 if (CHARSET_DIMENSION (charset) == 1)
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5695 EMIT_ONE_BYTE (code);
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5696 else if (CHARSET_DIMENSION (charset) == 2)
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5697 EMIT_TWO_BYTES (code >> 8, code & 0xFF);
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5698 else if (CHARSET_DIMENSION (charset) == 3)
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5699 EMIT_THREE_BYTES (code >> 16, (code >> 8) & 0xFF, code & 0xFF);
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5700 else
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5701 EMIT_FOUR_BYTES (code >> 24, (code >> 16) & 0xFF,
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5702 (code >> 8) & 0xFF, code & 0xFF);
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5703 }
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5704 else
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5705 {
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5706 if (coding->mode & CODING_MODE_SAFE_ENCODING)
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5707 c = CODING_INHIBIT_CHARACTER_SUBSTITUTION;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5708 else
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5709 c = coding->default_char;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5710 EMIT_ONE_BYTE (c);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5711 }
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5712 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5713 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5714
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5715 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5716 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5717 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5718 return 0;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5719 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5720
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5721
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5722 /*** 7. C library functions ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5723
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5724 /* Setup coding context CODING from information about CODING_SYSTEM.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5725 If CODING_SYSTEM is nil, `undecided' is assumed. If
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5726 CODING_SYSTEM is invalid, signal an error. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5727
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5728 void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
5729 setup_coding_system (Lisp_Object coding_system, struct coding_system *coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5730 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5731 Lisp_Object attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5732 Lisp_Object eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5733 Lisp_Object coding_type;
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
5734 Lisp_Object val;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5735
24460
be35d27a4bfb (setup_coding_system): Check for CODING_SYSTEM = nil.
Kenichi Handa <handa@m17n.org>
parents: 24425
diff changeset
5736 if (NILP (coding_system))
90011
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
5737 coding_system = Qundecided;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5738
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5739 CHECK_CODING_SYSTEM_GET_ID (coding_system, coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5740
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5741 attrs = CODING_ID_ATTRS (coding->id);
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
5742 eol_type = inhibit_eol_conversion ? Qunix : CODING_ID_EOL_TYPE (coding->id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5743
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5744 coding->mode = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5745 coding->head_ascii = -1;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5746 if (VECTORP (eol_type))
90587
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5747 coding->common_flags = (CODING_REQUIRE_DECODING_MASK
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5748 | CODING_REQUIRE_DETECTION_MASK);
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5749 else if (! EQ (eol_type, Qunix))
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5750 coding->common_flags = (CODING_REQUIRE_DECODING_MASK
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5751 | CODING_REQUIRE_ENCODING_MASK);
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5752 else
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5753 coding->common_flags = 0;
89448
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
5754 if (! NILP (CODING_ATTR_POST_READ (attrs)))
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
5755 coding->common_flags |= CODING_REQUIRE_DECODING_MASK;
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
5756 if (! NILP (CODING_ATTR_PRE_WRITE (attrs)))
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
5757 coding->common_flags |= CODING_REQUIRE_ENCODING_MASK;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5758 if (! NILP (CODING_ATTR_FOR_UNIBYTE (attrs)))
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5759 coding->common_flags |= CODING_FOR_UNIBYTE_MASK;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5760
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5761 val = CODING_ATTR_SAFE_CHARSETS (attrs);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5762 coding->max_charset_id = SCHARS (val) - 1;
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
5763 coding->safe_charsets = SDATA (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5764 coding->default_char = XINT (CODING_ATTR_DEFAULT_CHAR (attrs));
103655
e2d67c929da2 (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 103486
diff changeset
5765 coding->carryover_bytes = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5766
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5767 coding_type = CODING_ATTR_TYPE (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5768 if (EQ (coding_type, Qundecided))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5769 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5770 coding->detector = NULL;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5771 coding->decoder = decode_coding_raw_text;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5772 coding->encoder = encode_coding_raw_text;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5773 coding->common_flags |= CODING_REQUIRE_DETECTION_MASK;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5774 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5775 else if (EQ (coding_type, Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5776 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5777 int i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5778 int flags = XINT (AREF (attrs, coding_attr_iso_flags));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5779
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5780 /* Invoke graphic register 0 to plane 0. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5781 CODING_ISO_INVOCATION (coding, 0) = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5782 /* Invoke graphic register 1 to plane 1 if we can use 8-bit. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5783 CODING_ISO_INVOCATION (coding, 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5784 = (flags & CODING_ISO_FLAG_SEVEN_BITS ? -1 : 1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5785 /* Setup the initial status of designation. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5786 for (i = 0; i < 4; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5787 CODING_ISO_DESIGNATION (coding, i) = CODING_ISO_INITIAL (coding, i);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5788 /* Not single shifting initially. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5789 CODING_ISO_SINGLE_SHIFTING (coding) = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5790 /* Beginning of buffer should also be regarded as bol. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5791 CODING_ISO_BOL (coding) = 1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5792 coding->detector = detect_coding_iso_2022;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5793 coding->decoder = decode_coding_iso_2022;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5794 coding->encoder = encode_coding_iso_2022;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5795 if (flags & CODING_ISO_FLAG_SAFE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5796 coding->mode |= CODING_MODE_SAFE_ENCODING;
20227
71008f909642 (setup_coding_system): Initialize common_flags member
Kenichi Handa <handa@m17n.org>
parents: 20150
diff changeset
5797 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5798 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5799 | CODING_REQUIRE_FLUSHING_MASK);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5800 if (flags & CODING_ISO_FLAG_COMPOSITION)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5801 coding->common_flags |= CODING_ANNOTATE_COMPOSITION_MASK;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5802 if (flags & CODING_ISO_FLAG_DESIGNATION)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5803 coding->common_flags |= CODING_ANNOTATE_CHARSET_MASK;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5804 if (flags & CODING_ISO_FLAG_FULL_SUPPORT)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5805 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5806 setup_iso_safe_charsets (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5807 val = CODING_ATTR_SAFE_CHARSETS (attrs);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5808 coding->max_charset_id = SCHARS (val) - 1;
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
5809 coding->safe_charsets = SDATA (val);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5810 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5811 CODING_ISO_FLAGS (coding) = flags;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5812 CODING_ISO_CMP_STATUS (coding)->state = COMPOSING_NO;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5813 CODING_ISO_CMP_STATUS (coding)->method = COMPOSITION_NO;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5814 CODING_ISO_EXTSEGMENT_LEN (coding) = 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5815 CODING_ISO_EMBEDDED_UTF_8 (coding) = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5816 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5817 else if (EQ (coding_type, Qcharset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5818 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5819 coding->detector = detect_coding_charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5820 coding->decoder = decode_coding_charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5821 coding->encoder = encode_coding_charset;
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
5822 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5823 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5824 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5825 else if (EQ (coding_type, Qutf_8))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5826 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5827 val = AREF (attrs, coding_attr_utf_bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5828 CODING_UTF_8_BOM (coding) = (CONSP (val) ? utf_detect_bom
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5829 : EQ (val, Qt) ? utf_with_bom
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5830 : utf_without_bom);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5831 coding->detector = detect_coding_utf_8;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5832 coding->decoder = decode_coding_utf_8;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5833 coding->encoder = encode_coding_utf_8;
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
5834 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5835 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5836 if (CODING_UTF_8_BOM (coding) == utf_detect_bom)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5837 coding->common_flags |= CODING_REQUIRE_DETECTION_MASK;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5838 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5839 else if (EQ (coding_type, Qutf_16))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5840 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5841 val = AREF (attrs, coding_attr_utf_bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5842 CODING_UTF_16_BOM (coding) = (CONSP (val) ? utf_detect_bom
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5843 : EQ (val, Qt) ? utf_with_bom
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5844 : utf_without_bom);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5845 val = AREF (attrs, coding_attr_utf_16_endian);
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
5846 CODING_UTF_16_ENDIAN (coding) = (EQ (val, Qbig) ? utf_16_big_endian
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5847 : utf_16_little_endian);
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
5848 CODING_UTF_16_SURROGATE (coding) = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5849 coding->detector = detect_coding_utf_16;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5850 coding->decoder = decode_coding_utf_16;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5851 coding->encoder = encode_coding_utf_16;
20227
71008f909642 (setup_coding_system): Initialize common_flags member
Kenichi Handa <handa@m17n.org>
parents: 20150
diff changeset
5852 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5853 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5854 if (CODING_UTF_16_BOM (coding) == utf_detect_bom)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
5855 coding->common_flags |= CODING_REQUIRE_DETECTION_MASK;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5856 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5857 else if (EQ (coding_type, Qccl))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5858 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5859 coding->detector = detect_coding_ccl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5860 coding->decoder = decode_coding_ccl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5861 coding->encoder = encode_coding_ccl;
20227
71008f909642 (setup_coding_system): Initialize common_flags member
Kenichi Handa <handa@m17n.org>
parents: 20150
diff changeset
5862 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5863 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5864 | CODING_REQUIRE_FLUSHING_MASK);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5865 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5866 else if (EQ (coding_type, Qemacs_mule))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5867 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5868 coding->detector = detect_coding_emacs_mule;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5869 coding->decoder = decode_coding_emacs_mule;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5870 coding->encoder = encode_coding_emacs_mule;
20227
71008f909642 (setup_coding_system): Initialize common_flags member
Kenichi Handa <handa@m17n.org>
parents: 20150
diff changeset
5871 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5872 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5873 coding->spec.emacs_mule.full_support = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5874 if (! NILP (AREF (attrs, coding_attr_emacs_mule_full))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5875 && ! EQ (CODING_ATTR_CHARSET_LIST (attrs), Vemacs_mule_charset_list))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5876 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5877 Lisp_Object tail, safe_charsets;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5878 int max_charset_id = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5879
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5880 for (tail = Vemacs_mule_charset_list; CONSP (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5881 tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5882 if (max_charset_id < XFASTINT (XCAR (tail)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5883 max_charset_id = XFASTINT (XCAR (tail));
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
5884 safe_charsets = make_uninit_string (max_charset_id + 1);
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
5885 memset (SDATA (safe_charsets), 255, max_charset_id + 1);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5886 for (tail = Vemacs_mule_charset_list; CONSP (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5887 tail = XCDR (tail))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5888 SSET (safe_charsets, XFASTINT (XCAR (tail)), 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5889 coding->max_charset_id = max_charset_id;
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
5890 coding->safe_charsets = SDATA (safe_charsets);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5891 coding->spec.emacs_mule.full_support = 1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5892 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5893 coding->spec.emacs_mule.cmp_status.state = COMPOSING_NO;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5894 coding->spec.emacs_mule.cmp_status.method = COMPOSITION_NO;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5895 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5896 else if (EQ (coding_type, Qshift_jis))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5897 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5898 coding->detector = detect_coding_sjis;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5899 coding->decoder = decode_coding_sjis;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5900 coding->encoder = encode_coding_sjis;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5901 coding->common_flags
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5902 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5903 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5904 else if (EQ (coding_type, Qbig5))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5905 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5906 coding->detector = detect_coding_big5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5907 coding->decoder = decode_coding_big5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5908 coding->encoder = encode_coding_big5;
20227
71008f909642 (setup_coding_system): Initialize common_flags member
Kenichi Handa <handa@m17n.org>
parents: 20150
diff changeset
5909 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5910 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5911 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5912 else /* EQ (coding_type, Qraw_text) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5913 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5914 coding->detector = NULL;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5915 coding->decoder = decode_coding_raw_text;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5916 coding->encoder = encode_coding_raw_text;
89933
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5917 if (! EQ (eol_type, Qunix))
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5918 {
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5919 coding->common_flags |= CODING_REQUIRE_DECODING_MASK;
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5920 if (! VECTORP (eol_type))
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5921 coding->common_flags |= CODING_REQUIRE_ENCODING_MASK;
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5922 }
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5923
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5924 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5925
22616
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
5926 return;
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
5927 }
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
5928
90061
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5929 /* Return a list of charsets supported by CODING. */
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5930
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5931 Lisp_Object
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
5932 coding_charset_list (struct coding_system *coding)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
5933 {
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
5934 Lisp_Object attrs, charset_list;
90061
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5935
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5936 CODING_GET_INFO (coding, attrs, charset_list);
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5937 if (EQ (CODING_ATTR_TYPE (attrs), Qiso_2022))
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5938 {
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5939 int flags = XINT (AREF (attrs, coding_attr_iso_flags));
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5940
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5941 if (flags & CODING_ISO_FLAG_FULL_SUPPORT)
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5942 charset_list = Viso_2022_charset_list;
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5943 }
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5944 else if (EQ (CODING_ATTR_TYPE (attrs), Qemacs_mule))
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5945 {
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5946 charset_list = Vemacs_mule_charset_list;
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5947 }
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5948 return charset_list;
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5949 }
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5950
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5951
101776
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5952 /* Return a list of charsets supported by CODING-SYSTEM. */
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5953
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5954 Lisp_Object
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
5955 coding_system_charset_list (Lisp_Object coding_system)
101776
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5956 {
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5957 int id;
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5958 Lisp_Object attrs, charset_list;
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5959
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5960 CHECK_CODING_SYSTEM_GET_ID (coding_system, id);
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5961 attrs = CODING_ID_ATTRS (id);
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5962
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5963 if (EQ (CODING_ATTR_TYPE (attrs), Qiso_2022))
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5964 {
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5965 int flags = XINT (AREF (attrs, coding_attr_iso_flags));
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5966
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5967 if (flags & CODING_ISO_FLAG_FULL_SUPPORT)
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5968 charset_list = Viso_2022_charset_list;
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5969 else
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5970 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5971 }
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5972 else if (EQ (CODING_ATTR_TYPE (attrs), Qemacs_mule))
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5973 {
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5974 charset_list = Vemacs_mule_charset_list;
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5975 }
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5976 else
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5977 {
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5978 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5979 }
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5980 return charset_list;
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5981 }
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5982
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5983
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5984 /* Return raw-text or one of its subsidiaries that has the same
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5985 eol_type as CODING-SYSTEM. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5986
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5987 Lisp_Object
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
5988 raw_text_coding_system (Lisp_Object coding_system)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
5989 {
88430
6418a272b97e * coding.c: Delete unused variables.
Kenichi Handa <handa@m17n.org>
parents: 88365
diff changeset
5990 Lisp_Object spec, attrs;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5991 Lisp_Object eol_type, raw_text_eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5992
89462
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
5993 if (NILP (coding_system))
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
5994 return Qraw_text;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5995 spec = CODING_SYSTEM_SPEC (coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5996 attrs = AREF (spec, 0);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5997
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5998 if (EQ (CODING_ATTR_TYPE (attrs), Qraw_text))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5999 return coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6000
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6001 eol_type = AREF (spec, 2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6002 if (VECTORP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6003 return Qraw_text;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6004 spec = CODING_SYSTEM_SPEC (Qraw_text);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6005 raw_text_eol_type = AREF (spec, 2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6006 return (EQ (eol_type, Qunix) ? AREF (raw_text_eol_type, 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6007 : EQ (eol_type, Qdos) ? AREF (raw_text_eol_type, 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6008 : AREF (raw_text_eol_type, 2));
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6009 }
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6010
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6011
110834
b997f43af473 Fix complementing of a coding system
Kenichi Handa <handa@m17n.org>
parents: 110829
diff changeset
6012 /* If CODING_SYSTEM doesn't specify end-of-line format, return one of
b997f43af473 Fix complementing of a coding system
Kenichi Handa <handa@m17n.org>
parents: 110829
diff changeset
6013 the subsidiary that has the same eol-spec as PARENT (if it is not
b997f43af473 Fix complementing of a coding system
Kenichi Handa <handa@m17n.org>
parents: 110829
diff changeset
6014 nil and specifies end-of-line format) or the system's setting
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6015 (system_eol_type). */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6016
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6017 Lisp_Object
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
6018 coding_inherit_eol_type (Lisp_Object coding_system, Lisp_Object parent)
22616
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
6019 {
89545
4f394eed6ff2 (inhibit_pre_post_conversion): Removed (unused).
Dave Love <fx@gnu.org>
parents: 89519
diff changeset
6020 Lisp_Object spec, eol_type;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6021
89462
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
6022 if (NILP (coding_system))
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
6023 coding_system = Qraw_text;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6024 spec = CODING_SYSTEM_SPEC (coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6025 eol_type = AREF (spec, 2);
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6026 if (VECTORP (eol_type))
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6027 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6028 Lisp_Object parent_eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6029
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6030 if (! NILP (parent))
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6031 {
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6032 Lisp_Object parent_spec;
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6033
90587
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
6034 parent_spec = CODING_SYSTEM_SPEC (parent);
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6035 parent_eol_type = AREF (parent_spec, 2);
110834
b997f43af473 Fix complementing of a coding system
Kenichi Handa <handa@m17n.org>
parents: 110829
diff changeset
6036 if (VECTORP (parent_eol_type))
110855
bec49af30c2f Merge changes from emacs-23 branch.
Juanma Barranquero <lekktu@gmail.com>
parents: 110357 110847
diff changeset
6037 parent_eol_type = system_eol_type;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6038 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6039 else
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6040 parent_eol_type = system_eol_type;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6041 if (EQ (parent_eol_type, Qunix))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6042 coding_system = AREF (eol_type, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6043 else if (EQ (parent_eol_type, Qdos))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6044 coding_system = AREF (eol_type, 1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6045 else if (EQ (parent_eol_type, Qmac))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6046 coding_system = AREF (eol_type, 2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6047 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6048 return coding_system;
22616
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
6049 }
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
6050
110829
4d672e9d91bf Complement a coding system for encoding arguments and input to a process.
Kenichi Handa <handa@m17n.org>
parents: 110336
diff changeset
6051
4d672e9d91bf Complement a coding system for encoding arguments and input to a process.
Kenichi Handa <handa@m17n.org>
parents: 110336
diff changeset
6052 /* Check if text-conversion and eol-conversion of CODING_SYSTEM are
4d672e9d91bf Complement a coding system for encoding arguments and input to a process.
Kenichi Handa <handa@m17n.org>
parents: 110336
diff changeset
6053 decided for writing to a process. If not, complement them, and
4d672e9d91bf Complement a coding system for encoding arguments and input to a process.
Kenichi Handa <handa@m17n.org>
parents: 110336
diff changeset
6054 return a new coding system. */
4d672e9d91bf Complement a coding system for encoding arguments and input to a process.
Kenichi Handa <handa@m17n.org>
parents: 110336
diff changeset
6055
4d672e9d91bf Complement a coding system for encoding arguments and input to a process.
Kenichi Handa <handa@m17n.org>
parents: 110336
diff changeset
6056 Lisp_Object
110855
bec49af30c2f Merge changes from emacs-23 branch.
Juanma Barranquero <lekktu@gmail.com>
parents: 110357 110847
diff changeset
6057 complement_process_encoding_system (Lisp_Object coding_system)
110829
4d672e9d91bf Complement a coding system for encoding arguments and input to a process.
Kenichi Handa <handa@m17n.org>
parents: 110336
diff changeset
6058 {
110845
394a9ff3e3cf coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110834
diff changeset
6059 Lisp_Object coding_base = Qnil, eol_base = Qnil;
394a9ff3e3cf coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110834
diff changeset
6060 Lisp_Object spec, attrs;
110847
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6061 int i;
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6062
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6063 for (i = 0; i < 3; i++)
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6064 {
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6065 if (i == 1)
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6066 coding_system = CDR_SAFE (Vdefault_process_coding_system);
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6067 else if (i == 2)
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6068 coding_system = preferred_coding_system ();
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6069 spec = CODING_SYSTEM_SPEC (coding_system);
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6070 if (NILP (spec))
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6071 continue;
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6072 attrs = AREF (spec, 0);
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6073 if (NILP (coding_base) && ! EQ (CODING_ATTR_TYPE (attrs), Qundecided))
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6074 coding_base = CODING_ATTR_BASE_NAME (attrs);
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6075 if (NILP (eol_base) && ! VECTORP (AREF (spec, 2)))
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6076 eol_base = coding_system;
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6077 if (! NILP (coding_base) && ! NILP (eol_base))
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6078 break;
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6079 }
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6080
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6081 if (i > 0)
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6082 /* The original CODING_SYSTEM didn't specify text-conversion or
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6083 eol-conversion. Be sure that we return a fully complemented
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6084 coding system. */
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6085 coding_system = coding_inherit_eol_type (coding_base, eol_base);
c234b2db847c coding.c (complement_process_encoding_system): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 110845
diff changeset
6086 return coding_system;
110829
4d672e9d91bf Complement a coding system for encoding arguments and input to a process.
Kenichi Handa <handa@m17n.org>
parents: 110336
diff changeset
6087 }
4d672e9d91bf Complement a coding system for encoding arguments and input to a process.
Kenichi Handa <handa@m17n.org>
parents: 110336
diff changeset
6088
4d672e9d91bf Complement a coding system for encoding arguments and input to a process.
Kenichi Handa <handa@m17n.org>
parents: 110336
diff changeset
6089
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6090 /* Emacs has a mechanism to automatically detect a coding system if it
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6091 is one of Emacs' internal format, ISO2022, SJIS, and BIG5. But,
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6092 it's impossible to distinguish some coding systems accurately
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6093 because they use the same range of codes. So, at first, coding
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6094 systems are categorized into 7, those are:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6095
17835
f36ffb6f1208 Name change through the code:
Kenichi Handa <handa@m17n.org>
parents: 17725
diff changeset
6096 o coding-category-emacs-mule
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6097
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6098 The category for a coding system which has the same code range
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6099 as Emacs' internal format. Assigned the coding-system (Lisp
17835
f36ffb6f1208 Name change through the code:
Kenichi Handa <handa@m17n.org>
parents: 17725
diff changeset
6100 symbol) `emacs-mule' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6101
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6102 o coding-category-sjis
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6103
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6104 The category for a coding system which has the same code range
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6105 as SJIS. Assigned the coding-system (Lisp
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6106 symbol) `japanese-shift-jis' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6107
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6108 o coding-category-iso-7
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6109
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6110 The category for a coding system which has the same code range
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6111 as ISO2022 of 7-bit environment. This doesn't use any locking
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6112 shift and single shift functions. This can encode/decode all
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6113 charsets. Assigned the coding-system (Lisp symbol)
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6114 `iso-2022-7bit' by default.
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6115
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6116 o coding-category-iso-7-tight
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6117
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6118 Same as coding-category-iso-7 except that this can
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6119 encode/decode only the specified charsets.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6120
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6121 o coding-category-iso-8-1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6122
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6123 The category for a coding system which has the same code range
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6124 as ISO2022 of 8-bit environment and graphic plane 1 used only
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6125 for DIMENSION1 charset. This doesn't use any locking shift
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6126 and single shift functions. Assigned the coding-system (Lisp
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6127 symbol) `iso-latin-1' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6128
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6129 o coding-category-iso-8-2
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6130
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6131 The category for a coding system which has the same code range
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6132 as ISO2022 of 8-bit environment and graphic plane 1 used only
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6133 for DIMENSION2 charset. This doesn't use any locking shift
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6134 and single shift functions. Assigned the coding-system (Lisp
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6135 symbol) `japanese-iso-8bit' by default.
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6136
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6137 o coding-category-iso-7-else
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6138
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6139 The category for a coding system which has the same code range
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
6140 as ISO2022 of 7-bit environment but uses locking shift or
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6141 single shift functions. Assigned the coding-system (Lisp
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6142 symbol) `iso-2022-7bit-lock' by default.
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6143
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6144 o coding-category-iso-8-else
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6145
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6146 The category for a coding system which has the same code range
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
6147 as ISO2022 of 8-bit environment but uses locking shift or
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6148 single shift functions. Assigned the coding-system (Lisp
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6149 symbol) `iso-2022-8bit-ss2' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6150
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6151 o coding-category-big5
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6152
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6153 The category for a coding system which has the same code range
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6154 as BIG5. Assigned the coding-system (Lisp symbol)
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
6155 `cn-big5' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6156
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6157 o coding-category-utf-8
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6158
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6159 The category for a coding system which has the same code range
54303
5256a4b9366f UTF-8 is now RFC3629.
Eli Zaretskii <eliz@gnu.org>
parents: 53775
diff changeset
6160 as UTF-8 (cf. RFC3629). Assigned the coding-system (Lisp
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6161 symbol) `utf-8' by default.
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6162
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6163 o coding-category-utf-16-be
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6164
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6165 The category for a coding system in which a text has an
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6166 Unicode signature (cf. Unicode Standard) in the order of BIG
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6167 endian at the head. Assigned the coding-system (Lisp symbol)
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6168 `utf-16-be' by default.
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6169
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6170 o coding-category-utf-16-le
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6171
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6172 The category for a coding system in which a text has an
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6173 Unicode signature (cf. Unicode Standard) in the order of
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6174 LITTLE endian at the head. Assigned the coding-system (Lisp
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6175 symbol) `utf-16-le' by default.
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6176
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
6177 o coding-category-ccl
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
6178
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
6179 The category for a coding system whose encoder/decoder is
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
6180 written in CCL programs. The default value is nil, i.e., no
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
6181 coding system is assigned.
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
6182
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6183 o coding-category-binary
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6184
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6185 The category for a coding system not categorized in any of the
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6186 above. Assigned the coding-system (Lisp symbol)
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
6187 `no-conversion' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6188
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6189 Each of them is a Lisp symbol and the value is an actual
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6190 `coding-system' (this is also a Lisp symbol) assigned by a user.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6191 What Emacs actually does is detect the category of a coding system.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6192 Then, it uses a `coding-system' assigned to it. If Emacs can't
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6193 decide on a single possible category, it selects the category of the
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6194 highest priority. Priorities of categories are also specified by a
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6195 user in a Lisp variable `coding-category-list'.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6196
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6197 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6198
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Results of end-of-line detection.  EOL_SEEN_NONE means that no
   end-of-line was found; the non-zero values are distinct bits, so a
   result can be tested with `&' (as adjust_coding_eol_type does).  */
6199 #define EOL_SEEN_NONE 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6200 #define EOL_SEEN_LF 1
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6201 #define EOL_SEEN_CR 2
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6202 #define EOL_SEEN_CRLF 4
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6203
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6204 /* Detect how end-of-line of a text of length SRC_BYTES pointed by
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6205 SOURCE is encoded. If CATEGORY is one of
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6206 coding_category_utf_16_XXXX, assume that CR and LF are encoded by
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6207 two-byte, else they are encoded by one-byte.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6208
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6209 Return one of EOL_SEEN_XXX. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6210
19173
04ed7c3f5cee (detect_eol_type): If EOL representation does not
Richard M. Stallman <rms@gnu.org>
parents: 19134
diff changeset
6211 #define MAX_EOL_CHECK_COUNT 3
04ed7c3f5cee (detect_eol_type): If EOL representation does not
Richard M. Stallman <rms@gnu.org>
parents: 19134
diff changeset
6212
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6213 static int
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
6214 detect_eol (const unsigned char *source, EMACS_INT src_bytes,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
6215 enum coding_category category)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6216 {
84646
922a7e3b7383 (detect_eol_type, detect_eol_type_in_2_octet_form):
Michaël Cadilhac <michael.cadilhac@lrde.org>
parents: 83648
diff changeset
6217 const unsigned char *src = source, *src_end = src + src_bytes;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6218 unsigned char c;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6219 int total = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6220 int eol_seen = EOL_SEEN_NONE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6221
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
6222 if ((1 << category) & CATEGORY_MASK_UTF_16)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6223 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6224 int msb, lsb;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6225
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
6226 msb = category == (coding_category_utf_16_le
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
6227 | coding_category_utf_16_le_nosig);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6228 lsb = 1 - msb;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6229
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6230 while (src + 1 < src_end)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6231 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6232 c = src[lsb];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6233 if (src[msb] == 0 && (c == '\n' || c == '\r'))
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6234 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6235 int this_eol;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6236
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6237 if (c == '\n')
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6238 this_eol = EOL_SEEN_LF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6239 else if (src + 3 >= src_end
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6240 || src[msb + 2] != 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6241 || src[lsb + 2] != '\n')
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6242 this_eol = EOL_SEEN_CR;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6243 else
101678
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6244 {
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6245 this_eol = EOL_SEEN_CRLF;
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6246 src += 2;
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6247 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6248
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6249 if (eol_seen == EOL_SEEN_NONE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6250 /* This is the first end-of-line. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6251 eol_seen = this_eol;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6252 else if (eol_seen != this_eol)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6253 {
101678
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6254 /* The found type is different from what found before.
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6255 Allow for stray ^M characters in DOS EOL files. */
111997
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6256 if ((eol_seen == EOL_SEEN_CR && this_eol == EOL_SEEN_CRLF)
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6257 || (eol_seen == EOL_SEEN_CRLF
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6258 && this_eol == EOL_SEEN_CR))
101678
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6259 eol_seen = EOL_SEEN_CRLF;
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6260 else
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6261 {
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6262 eol_seen = EOL_SEEN_LF;
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6263 break;
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6264 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6265 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6266 if (++total == MAX_EOL_CHECK_COUNT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6267 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6268 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6269 src += 2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6270 }
30833
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
6271 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6272 else
111997
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6273 while (src < src_end)
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6274 {
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6275 c = *src++;
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6276 if (c == '\n' || c == '\r')
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6277 {
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6278 int this_eol;
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6279
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6280 if (c == '\n')
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6281 this_eol = EOL_SEEN_LF;
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6282 else if (src >= src_end || *src != '\n')
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6283 this_eol = EOL_SEEN_CR;
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6284 else
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6285 this_eol = EOL_SEEN_CRLF, src++;
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6286
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6287 if (eol_seen == EOL_SEEN_NONE)
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6288 /* This is the first end-of-line. */
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6289 eol_seen = this_eol;
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6290 else if (eol_seen != this_eol)
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6291 {
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6292 /* The found type is different from what found before.
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6293 Allow for stray ^M characters in DOS EOL files. */
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6294 if ((eol_seen == EOL_SEEN_CR && this_eol == EOL_SEEN_CRLF)
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6295 || (eol_seen == EOL_SEEN_CRLF && this_eol == EOL_SEEN_CR))
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6296 eol_seen = EOL_SEEN_CRLF;
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6297 else
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6298 {
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6299 eol_seen = EOL_SEEN_LF;
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6300 break;
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6301 }
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6302 }
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6303 if (++total == MAX_EOL_CHECK_COUNT)
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6304 break;
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6305 }
a5a188ddc758 Minor clean up to silence some gcc warnings.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 111779
diff changeset
6306 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6307 return eol_seen;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6308 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6309
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6310
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6311 static Lisp_Object
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
6312 adjust_coding_eol_type (struct coding_system *coding, int eol_seen)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6313 {
88430
6418a272b97e * coding.c: Delete unused variables.
Kenichi Handa <handa@m17n.org>
parents: 88365
diff changeset
6314 Lisp_Object eol_type;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
6315
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6316 eol_type = CODING_ID_EOL_TYPE (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6317 if (eol_seen & EOL_SEEN_LF)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6318 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6319 coding->id = CODING_SYSTEM_ID (AREF (eol_type, 0));
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6320 eol_type = Qunix;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6321 }
88862
108e2535280d (adjust_coding_eol_type): Fix eol_type/eol_seen mixup.
Dave Love <fx@gnu.org>
parents: 88856
diff changeset
6322 else if (eol_seen & EOL_SEEN_CRLF)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6323 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6324 coding->id = CODING_SYSTEM_ID (AREF (eol_type, 1));
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6325 eol_type = Qdos;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6326 }
88862
108e2535280d (adjust_coding_eol_type): Fix eol_type/eol_seen mixup.
Dave Love <fx@gnu.org>
parents: 88856
diff changeset
6327 else if (eol_seen & EOL_SEEN_CR)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6328 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6329 coding->id = CODING_SYSTEM_ID (AREF (eol_type, 2));
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6330 eol_type = Qmac;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6331 }
19181
917138730635 (detect_eol_type): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 19173
diff changeset
6332 return eol_type;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6333 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6334
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6335 /* Detect how a text specified in CODING is encoded. If a coding
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6336 system is detected, update fields of CODING by the detected coding
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6337 system. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6338
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6339 void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
6340 detect_coding (struct coding_system *coding)
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6341 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
6342 const unsigned char *src, *src_end;
102105
a5023e8bbb1e (detect_coding): Preserve coding->mode.
Kenichi Handa <handa@m17n.org>
parents: 102058
diff changeset
6343 int saved_mode = coding->mode;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6344
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6345 coding->consumed = coding->consumed_char = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6346 coding->produced = coding->produced_char = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6347 coding_set_source (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6348
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6349 src_end = coding->source + coding->src_bytes;
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6350 coding->head_ascii = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6351
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6352 /* If we have not yet decided the text encoding type, detect it
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6353 now. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6354 if (EQ (CODING_ATTR_TYPE (CODING_ID_ATTRS (coding->id)), Qundecided))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6355 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6356 int c, i;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6357 struct coding_detection_info detect_info;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6358 int null_byte_found = 0, eight_bit_found = 0;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6359
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6360 detect_info.checked = detect_info.found = detect_info.rejected = 0;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6361 for (src = coding->source; src < src_end; src++)
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6362 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6363 c = *src;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6364 if (c & 0x80)
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6365 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6366 eight_bit_found = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6367 if (null_byte_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6368 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6369 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6370 else if (c < 0x20)
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6371 {
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6372 if ((c == ISO_CODE_ESC || c == ISO_CODE_SI || c == ISO_CODE_SO)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6373 && ! inhibit_iso_escape_detection
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6374 && ! detect_info.checked)
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6375 {
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6376 if (detect_coding_iso_2022 (coding, &detect_info))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6377 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6378 /* We have scanned the whole data. */
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6379 if (! (detect_info.rejected & CATEGORY_MASK_ISO_7_ELSE))
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6380 {
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6381 /* We didn't find an 8-bit code. We may
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6382 have found a null-byte, but it's very
107984
bef5d1738c0b Make variable forwarding explicit rather the using special values.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 107507
diff changeset
6383 rare that a binary file conforms to
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6384 ISO-2022. */
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6385 src = src_end;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6386 coding->head_ascii = src - coding->source;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6387 }
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6388 detect_info.rejected |= ~CATEGORY_MASK_ISO_ESCAPE;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6389 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6390 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6391 }
101040
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
6392 else if (! c && !inhibit_null_byte_detection)
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6393 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6394 null_byte_found = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6395 if (eight_bit_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6396 break;
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6397 }
95585
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
6398 if (! eight_bit_found)
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
6399 coding->head_ascii++;
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6400 }
95585
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
6401 else if (! eight_bit_found)
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6402 coding->head_ascii++;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6403 }
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6404
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6405 if (null_byte_found || eight_bit_found
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6406 || coding->head_ascii < coding->src_bytes
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6407 || detect_info.found)
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6408 {
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6409 enum coding_category category;
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6410 struct coding_system *this;
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6411
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6412 if (coding->head_ascii == coding->src_bytes)
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6413 /* As all bytes are 7-bit, we can ignore non-ISO-2022 codings. */
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6414 for (i = 0; i < coding_category_raw_text; i++)
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6415 {
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6416 category = coding_priorities[i];
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6417 this = coding_categories + category;
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6418 if (detect_info.found & (1 << category))
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6419 break;
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6420 }
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6421 else
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6422 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6423 if (null_byte_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6424 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6425 detect_info.checked |= ~CATEGORY_MASK_UTF_16;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6426 detect_info.rejected |= ~CATEGORY_MASK_UTF_16;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6427 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6428 for (i = 0; i < coding_category_raw_text; i++)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6429 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6430 category = coding_priorities[i];
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6431 this = coding_categories + category;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6432 if (this->id < 0)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6433 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6434 /* No coding system of this category is defined. */
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6435 detect_info.rejected |= (1 << category);
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6436 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6437 else if (category >= coding_category_raw_text)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6438 continue;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6439 else if (detect_info.checked & (1 << category))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6440 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6441 if (detect_info.found & (1 << category))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6442 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6443 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6444 else if ((*(this->detector)) (coding, &detect_info)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6445 && detect_info.found & (1 << category))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6446 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6447 if (category == coding_category_utf_16_auto)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6448 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6449 if (detect_info.found & CATEGORY_MASK_UTF_16_LE)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6450 category = coding_category_utf_16_le;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6451 else
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6452 category = coding_category_utf_16_be;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6453 }
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6454 break;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6455 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6456 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6457 }
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6458
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6459 if (i < coding_category_raw_text)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6460 setup_coding_system (CODING_ID_NAME (this->id), coding);
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6461 else if (null_byte_found)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6462 setup_coding_system (Qno_conversion, coding);
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6463 else if ((detect_info.rejected & CATEGORY_MASK_ANY)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6464 == CATEGORY_MASK_ANY)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6465 setup_coding_system (Qraw_text, coding);
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6466 else if (detect_info.rejected)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6467 for (i = 0; i < coding_category_raw_text; i++)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6468 if (! (detect_info.rejected & (1 << coding_priorities[i])))
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6469 {
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6470 this = coding_categories + coding_priorities[i];
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6471 setup_coding_system (CODING_ID_NAME (this->id), coding);
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6472 break;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6473 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6474 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6475 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6476 else if (XINT (CODING_ATTR_CATEGORY (CODING_ID_ATTRS (coding->id)))
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6477 == coding_category_utf_8_auto)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6478 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6479 Lisp_Object coding_systems;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6480 struct coding_detection_info detect_info;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6481
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6482 coding_systems
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6483 = AREF (CODING_ID_ATTRS (coding->id), coding_attr_utf_bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6484 detect_info.found = detect_info.rejected = 0;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6485 coding->head_ascii = 0;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6486 if (CONSP (coding_systems)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6487 && detect_coding_utf_8 (coding, &detect_info))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6488 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6489 if (detect_info.found & CATEGORY_MASK_UTF_8_SIG)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6490 setup_coding_system (XCAR (coding_systems), coding);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6491 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6492 setup_coding_system (XCDR (coding_systems), coding);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6493 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6494 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6495 else if (XINT (CODING_ATTR_CATEGORY (CODING_ID_ATTRS (coding->id)))
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6496 == coding_category_utf_16_auto)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6497 {
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6498 Lisp_Object coding_systems;
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6499 struct coding_detection_info detect_info;
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6500
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6501 coding_systems
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6502 = AREF (CODING_ID_ATTRS (coding->id), coding_attr_utf_bom);
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6503 detect_info.found = detect_info.rejected = 0;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6504 coding->head_ascii = 0;
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6505 if (CONSP (coding_systems)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6506 && detect_coding_utf_16 (coding, &detect_info))
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6507 {
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6508 if (detect_info.found & CATEGORY_MASK_UTF_16_LE)
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6509 setup_coding_system (XCAR (coding_systems), coding);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6510 else if (detect_info.found & CATEGORY_MASK_UTF_16_BE)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6511 setup_coding_system (XCDR (coding_systems), coding);
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6512 }
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6513 }
102105
a5023e8bbb1e (detect_coding): Preserve coding->mode.
Kenichi Handa <handa@m17n.org>
parents: 102058
diff changeset
6514 coding->mode = saved_mode;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6515 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6516
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6517
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6518 static void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
6519 decode_eol (struct coding_system *coding)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6520 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6521 Lisp_Object eol_type;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6522 unsigned char *p, *pbeg, *pend;
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
6523
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6524 eol_type = CODING_ID_EOL_TYPE (coding->id);
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
6525 if (EQ (eol_type, Qunix) || inhibit_eol_conversion)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6526 return;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6527
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6528 if (NILP (coding->dst_object))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6529 pbeg = coding->destination;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6530 else
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6531 pbeg = BYTE_POS_ADDR (coding->dst_pos_byte);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6532 pend = pbeg + coding->produced;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6533
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6534 if (VECTORP (eol_type))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6535 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6536 int eol_seen = EOL_SEEN_NONE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6537
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6538 for (p = pbeg; p < pend; p++)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6539 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6540 if (*p == '\n')
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6541 eol_seen |= EOL_SEEN_LF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6542 else if (*p == '\r')
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6543 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6544 if (p + 1 < pend && *(p + 1) == '\n')
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6545 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6546 eol_seen |= EOL_SEEN_CRLF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6547 p++;
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6548 }
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6549 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6550 eol_seen |= EOL_SEEN_CR;
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6551 }
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6552 }
101678
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6553 /* Handle DOS-style EOLs in a file with stray ^M characters. */
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6554 if ((eol_seen & EOL_SEEN_CRLF) != 0
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6555 && (eol_seen & EOL_SEEN_CR) != 0
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6556 && (eol_seen & EOL_SEEN_LF) == 0)
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6557 eol_seen = EOL_SEEN_CRLF;
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6558 else if (eol_seen != EOL_SEEN_NONE
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6559 && eol_seen != EOL_SEEN_LF
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6560 && eol_seen != EOL_SEEN_CRLF
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6561 && eol_seen != EOL_SEEN_CR)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6562 eol_seen = EOL_SEEN_LF;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6563 if (eol_seen != EOL_SEEN_NONE)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6564 eol_type = adjust_coding_eol_type (coding, eol_seen);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6565 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6566
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6567 if (EQ (eol_type, Qmac))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6568 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6569 for (p = pbeg; p < pend; p++)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6570 if (*p == '\r')
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6571 *p = '\n';
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6572 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6573 else if (EQ (eol_type, Qdos))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6574 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6575 int n = 0;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6576
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6577 if (NILP (coding->dst_object))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6578 {
90378
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6579 /* Start deleting '\r' from the tail to minimize the memory
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6580 movement. */
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6581 for (p = pend - 2; p >= pbeg; p--)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6582 if (*p == '\r')
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6583 {
109165
750db9f3e6d8 Replace bcopy, bzero, bcmp by memcpy, memmove, memset, memcmp
Andreas Schwab <schwab@linux-m68k.org>
parents: 109159
diff changeset
6584 memmove (p, p + 1, pend-- - p - 1);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6585 n++;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6586 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6587 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6588 else
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6589 {
90378
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6590 int pos_byte = coding->dst_pos_byte;
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6591 int pos = coding->dst_pos;
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6592 int pos_end = pos + coding->produced_char - 1;
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6593
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6594 while (pos < pos_end)
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6595 {
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6596 p = BYTE_POS_ADDR (pos_byte);
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6597 if (*p == '\r' && p[1] == '\n')
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6598 {
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6599 del_range_2 (pos, pos_byte, pos + 1, pos_byte + 1, 0);
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6600 n++;
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6601 pos_end--;
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6602 }
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6603 pos++;
91535
419a669bc4f2 (decode_eol): Pay attention to coding->dst_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 91367
diff changeset
6604 if (coding->dst_multibyte)
419a669bc4f2 (decode_eol): Pay attention to coding->dst_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 91367
diff changeset
6605 pos_byte += BYTES_BY_CHAR_HEAD (*p);
419a669bc4f2 (decode_eol): Pay attention to coding->dst_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 91367
diff changeset
6606 else
419a669bc4f2 (decode_eol): Pay attention to coding->dst_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 91367
diff changeset
6607 pos_byte++;
90378
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6608 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6609 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6610 coding->produced -= n;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6611 coding->produced_char -= n;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6612 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6613 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6614
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6615
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
6616 /* Return a translation table (or list of them) from coding system
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
6617 attribute vector ATTRS for encoding (ENCODEP is nonzero) or
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
6618 decoding (ENCODEP is zero). */
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6619
89858
23cb9ed79225 (get_translation_table): Declare it as Lisp_Object.
Kenichi Handa <handa@m17n.org>
parents: 89856
diff changeset
6620 static Lisp_Object
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
6621 get_translation_table (Lisp_Object attrs, int encodep, int *max_lookup)
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6622 {
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6623 Lisp_Object standard, translation_table;
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6624 Lisp_Object val;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6625
103306
3680b4fe0f79 * coding.c (get_translation_table): Check Venable_character_translation.
Chong Yidong <cyd@stupidchicken.com>
parents: 103133
diff changeset
6626 if (NILP (Venable_character_translation))
3680b4fe0f79 * coding.c (get_translation_table): Check Venable_character_translation.
Chong Yidong <cyd@stupidchicken.com>
parents: 103133
diff changeset
6627 {
3680b4fe0f79 * coding.c (get_translation_table): Check Venable_character_translation.
Chong Yidong <cyd@stupidchicken.com>
parents: 103133
diff changeset
6628 if (max_lookup)
3680b4fe0f79 * coding.c (get_translation_table): Check Venable_character_translation.
Chong Yidong <cyd@stupidchicken.com>
parents: 103133
diff changeset
6629 *max_lookup = 0;
3680b4fe0f79 * coding.c (get_translation_table): Check Venable_character_translation.
Chong Yidong <cyd@stupidchicken.com>
parents: 103133
diff changeset
6630 return Qnil;
3680b4fe0f79 * coding.c (get_translation_table): Check Venable_character_translation.
Chong Yidong <cyd@stupidchicken.com>
parents: 103133
diff changeset
6631 }
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6632 if (encodep)
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6633 translation_table = CODING_ATTR_ENCODE_TBL (attrs),
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6634 standard = Vstandard_translation_table_for_encode;
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6635 else
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6636 translation_table = CODING_ATTR_DECODE_TBL (attrs),
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6637 standard = Vstandard_translation_table_for_decode;
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
6638 if (NILP (translation_table))
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6639 translation_table = standard;
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6640 else
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6641 {
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6642 if (SYMBOLP (translation_table))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6643 translation_table = Fget (translation_table, Qtranslation_table);
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6644 else if (CONSP (translation_table))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6645 {
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6646 translation_table = Fcopy_sequence (translation_table);
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6647 for (val = translation_table; CONSP (val); val = XCDR (val))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6648 if (SYMBOLP (XCAR (val)))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6649 XSETCAR (val, Fget (XCAR (val), Qtranslation_table));
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6650 }
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6651 if (CHAR_TABLE_P (standard))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6652 {
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6653 if (CONSP (translation_table))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6654 translation_table = nconc2 (translation_table,
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6655 Fcons (standard, Qnil));
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6656 else
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6657 translation_table = Fcons (translation_table,
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6658 Fcons (standard, Qnil));
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6659 }
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6660 }
89861
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6661
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6662 if (max_lookup)
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6663 {
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6664 *max_lookup = 1;
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6665 if (CHAR_TABLE_P (translation_table)
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6666 && CHAR_TABLE_EXTRA_SLOTS (XCHAR_TABLE (translation_table)) > 1)
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6667 {
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6668 val = XCHAR_TABLE (translation_table)->extras[1];
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6669 if (NATNUMP (val) && *max_lookup < XFASTINT (val))
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6670 *max_lookup = XFASTINT (val);
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6671 }
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6672 else if (CONSP (translation_table))
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6673 {
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6674 Lisp_Object tail, val;
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6675
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6676 for (tail = translation_table; CONSP (tail); tail = XCDR (tail))
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6677 if (CHAR_TABLE_P (XCAR (tail))
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6678 && CHAR_TABLE_EXTRA_SLOTS (XCHAR_TABLE (XCAR (tail))) > 1)
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6679 {
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6680 val = XCHAR_TABLE (XCAR (tail))->extras[1];
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6681 if (NATNUMP (val) && *max_lookup < XFASTINT (val))
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6682 *max_lookup = XFASTINT (val);
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6683 }
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6684 }
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
6685 }
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6686 return translation_table;
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6687 }
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6688
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
/* Translate character C through TABLE, which should be a char-table
   or a list; elements of the list that are not char-tables are
   ignored, and any other kind of TABLE leaves C unchanged.

   C and TRANS must be lvalues, and TABLE is evaluated more than once.
   Whenever a lookup yields a character, C is replaced by it and TRANS
   is reset to Qnil; with a list, the remaining tables are then
   applied to the new C.  If a lookup yields a non-nil value that is
   not a character, it is left in TRANS and the lookup stops.
   Otherwise TRANS is Qnil on exit.  */
#define LOOKUP_TRANSLATION_TABLE(table, c, trans)               \
  do {                                                          \
    trans = Qnil;                                               \
    if (CHAR_TABLE_P (table))                                   \
      {                                                         \
        trans = CHAR_TABLE_REF (table, c);                      \
        if (CHARACTERP (trans))                                 \
          {                                                     \
            c = XFASTINT (trans);                               \
            trans = Qnil;                                       \
          }                                                     \
      }                                                         \
    else if (CONSP (table))                                     \
      {                                                         \
        Lisp_Object tail;                                       \
                                                                \
        tail = table;                                           \
        while (CONSP (tail))                                    \
          {                                                     \
            if (CHAR_TABLE_P (XCAR (tail)))                     \
              {                                                 \
                trans = CHAR_TABLE_REF (XCAR (tail), c);        \
                if (CHARACTERP (trans))                         \
                  {                                             \
                    c = XFASTINT (trans);                       \
                    trans = Qnil;                               \
                  }                                             \
                else if (! NILP (trans))                        \
                  break;                                        \
              }                                                 \
            tail = XCDR (tail);                                 \
          }                                                     \
      }                                                         \
  } while (0)
23cb9ed79225 (get_translation_table): Declare it as Lisp_Object.
Kenichi Handa <handa@m17n.org>
parents: 89856
diff changeset
6713
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6714
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6715 /* Return a translation of character(s) at BUF according to TRANS.
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6716 TRANS is TO-CHAR or ((FROM . TO) ...) where
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6717 FROM = [FROM-CHAR ...], TO is TO-CHAR or [TO-CHAR ...].
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6718 The return value is TO-CHAR or ([FROM-CHAR ...] . TO) if a
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6719 translation is found, and Qnil if not found..
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6720 If BUF is too short to lookup characters in FROM, return Qt. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6721
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6722 static Lisp_Object
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
6723 get_translation (Lisp_Object trans, int *buf, int *buf_end)
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6724 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6725
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6726 if (INTEGERP (trans))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6727 return trans;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6728 for (; CONSP (trans); trans = XCDR (trans))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6729 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6730 Lisp_Object val = XCAR (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6731 Lisp_Object from = XCAR (val);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6732 int len = ASIZE (from);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6733 int i;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6734
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6735 for (i = 0; i < len; i++)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6736 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6737 if (buf + i == buf_end)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6738 return Qt;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6739 if (XINT (AREF (from, i)) != buf[i])
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6740 break;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6741 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6742 if (i == len)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6743 return val;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6744 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6745 return Qnil;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6746 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6747
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6748
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6749 static int
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
6750 produce_chars (struct coding_system *coding, Lisp_Object translation_table,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
6751 int last_block)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6752 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6753 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6754 unsigned char *dst_end = coding->destination + coding->dst_bytes;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6755 EMACS_INT produced;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6756 EMACS_INT produced_chars = 0;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6757 int carryover = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6758
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6759 if (! coding->chars_at_source)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6760 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6761 /* Source characters are in coding->charbuf. */
89575
59d10ebd2a0b (produce_chars): Revert last change.
Andreas Schwab <schwab@suse.de>
parents: 89571
diff changeset
6762 int *buf = coding->charbuf;
59d10ebd2a0b (produce_chars): Revert last change.
Andreas Schwab <schwab@suse.de>
parents: 89571
diff changeset
6763 int *buf_end = buf + coding->charbuf_used;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6764
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6765 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6766 {
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6767 coding_set_source (coding);
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6768 dst_end = ((unsigned char *) coding->source) + coding->consumed;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6769 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6770
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6771 while (buf < buf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6772 {
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6773 int c = *buf, i;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6774
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6775 if (c >= 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6776 {
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6777 int from_nchars = 1, to_nchars = 1;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6778 Lisp_Object trans = Qnil;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6779
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6780 LOOKUP_TRANSLATION_TABLE (translation_table, c, trans);
89858
23cb9ed79225 (get_translation_table): Declare it as Lisp_Object.
Kenichi Handa <handa@m17n.org>
parents: 89856
diff changeset
6781 if (! NILP (trans))
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6782 {
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6783 trans = get_translation (trans, buf, buf_end);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6784 if (INTEGERP (trans))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6785 c = XINT (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6786 else if (CONSP (trans))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6787 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6788 from_nchars = ASIZE (XCAR (trans));
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6789 trans = XCDR (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6790 if (INTEGERP (trans))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6791 c = XINT (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6792 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6793 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6794 to_nchars = ASIZE (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6795 c = XINT (AREF (trans, 0));
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6796 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6797 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6798 else if (EQ (trans, Qt) && ! last_block)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6799 break;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6800 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6801
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6802 if (dst + MAX_MULTIBYTE_LENGTH * to_nchars > dst_end)
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6803 {
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6804 dst = alloc_destination (coding,
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6805 buf_end - buf
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6806 + MAX_MULTIBYTE_LENGTH * to_nchars,
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6807 dst);
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6808 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6809 {
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6810 coding_set_source (coding);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6811 dst_end = (((unsigned char *) coding->source)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6812 + coding->consumed);
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6813 }
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6814 else
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6815 dst_end = coding->destination + coding->dst_bytes;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6816 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6817
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6818 for (i = 0; i < to_nchars; i++)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6819 {
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6820 if (i > 0)
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6821 c = XINT (AREF (trans, i));
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6822 if (coding->dst_multibyte
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6823 || ! CHAR_BYTE8_P (c))
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6824 CHAR_STRING_ADVANCE_NO_UNIFY (c, dst);
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6825 else
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6826 *dst++ = CHAR_TO_BYTE8 (c);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6827 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6828 produced_chars += to_nchars;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6829 buf += from_nchars;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6830 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6831 else
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6832 /* This is an annotation datum. (-C) is the length. */
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6833 buf += -c;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6834 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6835 carryover = buf_end - buf;
30833
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
6836 }
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
6837 else
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
6838 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6839 /* Source characters are at coding->source. */
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
6840 const unsigned char *src = coding->source;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6841 const unsigned char *src_end = src + coding->consumed;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6842
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6843 if (EQ (coding->dst_object, coding->src_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6844 dst_end = (unsigned char *) src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6845 if (coding->src_multibyte != coding->dst_multibyte)
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6846 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6847 if (coding->src_multibyte)
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6848 {
88443
6b86cf30a0b9 (produce_chars): Set the variable `multibytep' correctly.
Kenichi Handa <handa@m17n.org>
parents: 88438
diff changeset
6849 int multibytep = 1;
100135
0e17542db552 (detect_coding_system): Initialize utf_16_le_eol to -1, val to
Kenichi Handa <handa@m17n.org>
parents: 100133
diff changeset
6850 EMACS_INT consumed_chars = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6851
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6852 while (1)
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6853 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
6854 const unsigned char *src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6855 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6856
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6857 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6858 if (dst == dst_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6859 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6860 if (EQ (coding->src_object, coding->dst_object))
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6861 dst_end = (unsigned char *) src;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6862 if (dst == dst_end)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6863 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6864 EMACS_INT offset = src - coding->source;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6865
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6866 dst = alloc_destination (coding, src_end - src + 1,
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6867 dst);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6868 dst_end = coding->destination + coding->dst_bytes;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6869 coding_set_source (coding);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6870 src = coding->source + offset;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6871 src_end = coding->source + coding->src_bytes;
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6872 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6873 dst_end = (unsigned char *) src;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6874 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6875 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6876 *dst++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6877 produced_chars++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6878 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6879 no_more_source:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6880 ;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6881 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6882 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6883 while (src < src_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6884 {
88443
6b86cf30a0b9 (produce_chars): Set the variable `multibytep' correctly.
Kenichi Handa <handa@m17n.org>
parents: 88438
diff changeset
6885 int multibytep = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6886 int c = *src++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6887
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6888 if (dst >= dst_end - 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6889 {
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6890 if (EQ (coding->src_object, coding->dst_object))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
6891 dst_end = (unsigned char *) src;
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6892 if (dst >= dst_end - 1)
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6893 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6894 EMACS_INT offset = src - coding->source;
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6895 EMACS_INT more_bytes;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6896
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6897 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6898 more_bytes = ((src_end - src) / 2) + 2;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6899 else
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6900 more_bytes = src_end - src + 2;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6901 dst = alloc_destination (coding, more_bytes, dst);
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6902 dst_end = coding->destination + coding->dst_bytes;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6903 coding_set_source (coding);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6904 src = coding->source + offset;
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6905 src_end = coding->source + coding->src_bytes;
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6906 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6907 dst_end = (unsigned char *) src;
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6908 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6909 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6910 EMIT_ONE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6911 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6912 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6913 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6914 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6915 if (!EQ (coding->src_object, coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6916 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6917 EMACS_INT require = coding->src_bytes - coding->dst_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6918
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6919 if (require > 0)
23325
bbd06336cd0c (check_composing_code): If the current composing
Kenichi Handa <handa@m17n.org>
parents: 23315
diff changeset
6920 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6921 EMACS_INT offset = src - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6922
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6923 dst = alloc_destination (coding, require, dst);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6924 coding_set_source (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6925 src = coding->source + offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6926 src_end = coding->source + coding->src_bytes;
23325
bbd06336cd0c (check_composing_code): If the current composing
Kenichi Handa <handa@m17n.org>
parents: 23315
diff changeset
6927 }
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6928 }
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6929 produced_chars = coding->consumed_char;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6930 while (src < src_end)
92406
c36bda0a03cc (decode_coding_big5, produce_chars): Fix typos in last
Andreas Schwab <schwab@suse.de>
parents: 92399
diff changeset
6931 *dst++ = *src++;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6932 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6933 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6934
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6935 produced = dst - (coding->destination + coding->produced);
90809
3c52757d5f6e (produce_chars): Don't call insert_from_gap if no
Kenichi Handa <handa@m17n.org>
parents: 90772
diff changeset
6936 if (BUFFERP (coding->dst_object) && produced_chars > 0)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6937 insert_from_gap (produced_chars, produced);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6938 coding->produced += produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6939 coding->produced_char += produced_chars;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6940 return carryover;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6941 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6942
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6943 /* Compose text in CODING->object according to the annotation data at
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6944 CHARBUF. CHARBUF is an array:
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6945 [ -LENGTH ANNOTATION_MASK NCHARS NBYTES METHOD [ COMPONENTS... ] ]
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6946 */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6947
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6948 static INLINE void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
6949 produce_composition (struct coding_system *coding, int *charbuf, EMACS_INT pos)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6950 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6951 int len;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6952 EMACS_INT to;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6953 enum composition_method method;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6954 Lisp_Object components;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6955
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6956 len = -charbuf[0] - MAX_ANNOTATION_LENGTH;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6957 to = pos + charbuf[2];
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6958 method = (enum composition_method) (charbuf[4]);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6959
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6960 if (method == COMPOSITION_RELATIVE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6961 components = Qnil;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6962 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6963 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6964 Lisp_Object args[MAX_COMPOSITION_COMPONENTS * 2 - 1];
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6965 int i, j;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6966
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6967 if (method == COMPOSITION_WITH_RULE)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6968 len = charbuf[2] * 3 - 2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6969 charbuf += MAX_ANNOTATION_LENGTH;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6970 /* charbuf = [ CHRA ... CHAR] or [ CHAR -2 RULE ... CHAR ] */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6971 for (i = j = 0; i < len && charbuf[i] != -1; i++, j++)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6972 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6973 if (charbuf[i] >= 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6974 args[j] = make_number (charbuf[i]);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6975 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6976 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6977 i++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6978 args[j] = make_number (charbuf[i] % 0x100);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6979 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6980 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6981 components = (i == j ? Fstring (j, args) : Fvector (j, args));
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6982 }
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6983 compose_text (pos, to, components, Qnil, coding->dst_object);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6984 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6985
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6986
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6987 /* Put `charset' property on text in CODING->object according to
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6988 the annotation data at CHARBUF. CHARBUF is an array:
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6989 [ -LENGTH ANNOTATION_MASK NCHARS CHARSET-ID ]
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6990 */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6991
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6992 static INLINE void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
6993 produce_charset (struct coding_system *coding, int *charbuf, EMACS_INT pos)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6994 {
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6995 EMACS_INT from = pos - charbuf[2];
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6996 struct charset *charset = CHARSET_FROM_ID (charbuf[3]);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6997
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6998 Fput_text_property (make_number (from), make_number (pos),
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6999 Qcharset, CHARSET_NAME (charset),
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7000 coding->dst_object);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7001 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7002
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7003
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Preferred number of `int' elements in the conversion work buffer.  */
#define CHARBUF_SIZE 0x4000

/* Allocate CODING->charbuf on the caller's stack with alloca and
   record its element count in CODING->charbuf_size.

   The first attempt asks for CHARBUF_SIZE elements; each time alloca
   yields a null pointer the request is halved, as long as it stays
   above 1024 elements.  If no attempt yields a buffer, the result
   CODING_RESULT_INSUFFICIENT_MEM is recorded and the *enclosing
   function* returns CODING->result, so this macro may only be used
   inside a function whose return type is compatible with that value.

   NOTE(review): alloca normally does not signal failure by returning
   a null pointer, so the retry and failure paths are probably never
   taken in practice -- confirm before relying on them.  */
#define ALLOC_CONVERSION_WORK_AREA(coding)                                \
  do {                                                                    \
    int size;                                                             \
                                                                          \
    coding->charbuf = NULL;                                               \
    for (size = CHARBUF_SIZE; size > 1024; size >>= 1)                    \
      {                                                                   \
        coding->charbuf = (int *) alloca (sizeof (int) * size);           \
        if (coding->charbuf)                                              \
          break;                                                          \
      }                                                                   \
    if (! coding->charbuf)                                                \
      {                                                                   \
        record_conversion_result (coding, CODING_RESULT_INSUFFICIENT_MEM); \
        return coding->result;                                            \
      }                                                                   \
    coding->charbuf_size = size;                                          \
  } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7025
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7026
30833
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
7027 static void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
7028 produce_annotation (struct coding_system *coding, EMACS_INT pos)
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
7029 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7030 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7031 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7032
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7033 if (NILP (coding->dst_object))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7034 return;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7035
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7036 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7037 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7038 if (*charbuf >= 0)
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7039 pos++, charbuf++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7040 else
29877
7b43e1fb478a (decode_eol_post_ccl): Special handling for undecided
Eli Zaretskii <eliz@gnu.org>
parents: 29725
diff changeset
7041 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7042 int len = -*charbuf;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7043
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7044 if (len > 2)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7045 switch (charbuf[1])
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7046 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7047 case CODING_ANNOTATE_COMPOSITION_MASK:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7048 produce_composition (coding, charbuf, pos);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7049 break;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7050 case CODING_ANNOTATE_CHARSET_MASK:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7051 produce_charset (coding, charbuf, pos);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7052 break;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7053 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7054 charbuf += len;
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
7055 }
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
7056 }
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
7057 }
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
7058
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7059 /* Decode the data at CODING->src_object into CODING->dst_object.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7060 CODING->src_object is a buffer, a string, or nil.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7061 CODING->dst_object is a buffer.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7062
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7063 If CODING->src_object is a buffer, it must be the current buffer.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7064 In this case, if CODING->src_pos is positive, it is a position of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7065 the source text in the buffer, otherwise, the source text is in the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7066 gap area of the buffer, and CODING->src_pos specifies the offset of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7067 the text from GPT (which must be the same as PT). If this is the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7068 same buffer as CODING->dst_object, CODING->src_pos must be
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7069 negative.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7070
90380
4bf7966e0788 (decode_coding): Typo in comment fixed.
Kenichi Handa <handa@m17n.org>
parents: 90378
diff changeset
7071 If CODING->src_object is a string, CODING->src_pos is an index to
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7072 that string.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7073
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7074 If CODING->src_object is nil, CODING->source must already point to
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7075 the non-relocatable memory area. In this case, CODING->src_pos is
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7076 an offset from CODING->source.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7077
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7078 The decoded data is inserted at the current point of the buffer
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7079 CODING->dst_object.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7080 */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7081
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7082 static int
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
7083 decode_coding (struct coding_system *coding)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7084 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7085 Lisp_Object attrs;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7086 Lisp_Object undo_list;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
7087 Lisp_Object translation_table;
107171
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
7088 struct ccl_spec cclspec;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7089 int carryover;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7090 int i;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7091
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7092 if (BUFFERP (coding->src_object)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7093 && coding->src_pos > 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7094 && coding->src_pos < GPT
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7095 && coding->src_pos + coding->src_chars > GPT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7096 move_gap_both (coding->src_pos, coding->src_pos_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7097
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7098 undo_list = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7099 if (BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7100 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7101 if (current_buffer != XBUFFER (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7102 set_buffer_internal (XBUFFER (coding->dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7103 if (GPT != PT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7104 move_gap_both (PT, PT_BYTE);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7105 undo_list = current_buffer->undo_list;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7106 current_buffer->undo_list = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7107 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7108
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7109 coding->consumed = coding->consumed_char = 0;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
7110 coding->produced = coding->produced_char = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7111 coding->chars_at_source = 0;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7112 record_conversion_result (coding, CODING_RESULT_SUCCESS);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
7113 coding->errors = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7114
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7115 ALLOC_CONVERSION_WORK_AREA (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7116
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7117 attrs = CODING_ID_ATTRS (coding->id);
89861
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
7118 translation_table = get_translation_table (attrs, 0, NULL);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7119
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7120 carryover = 0;
107171
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
7121 if (coding->decoder == decode_coding_ccl)
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
7122 {
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
7123 coding->spec.ccl = &cclspec;
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
7124 setup_ccl_program (&cclspec.ccl, CODING_CCL_DECODER (coding));
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
7125 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7126 do
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7127 {
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7128 EMACS_INT pos = coding->dst_pos + coding->produced_char;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7129
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7130 coding_set_source (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7131 coding->annotated = 0;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7132 coding->charbuf_used = carryover;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7133 (*(coding->decoder)) (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7134 coding_set_destination (coding);
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7135 carryover = produce_chars (coding, translation_table, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7136 if (coding->annotated)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7137 produce_annotation (coding, pos);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7138 for (i = 0; i < carryover; i++)
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7139 coding->charbuf[i]
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7140 = coding->charbuf[coding->charbuf_used - carryover + i];
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7141 }
107171
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
7142 while (coding->result == CODING_RESULT_INSUFFICIENT_DST
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
7143 || (coding->consumed < coding->src_bytes
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
7144 && (coding->result == CODING_RESULT_SUCCESS
dfc03b454687 Fix the ccl decoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 106918
diff changeset
7145 || coding->result == CODING_RESULT_INVALID_SRC)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7146
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7147 if (carryover > 0)
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7148 {
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7149 coding_set_destination (coding);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7150 coding->charbuf_used = carryover;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7151 produce_chars (coding, translation_table, 1);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7152 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7153
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7154 coding->carryover_bytes = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7155 if (coding->consumed < coding->src_bytes)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7156 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7157 int nbytes = coding->src_bytes - coding->consumed;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
7158 const unsigned char *src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7159
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7160 coding_set_source (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7161 coding_set_destination (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7162 src = coding->source + coding->consumed;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7163
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7164 if (coding->mode & CODING_MODE_LAST_BLOCK)
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
7165 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7166 /* Flush out unprocessed data as binary chars. We are sure
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7167 that the number of data is less than the size of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7168 coding->charbuf. */
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7169 coding->charbuf_used = 0;
100587
d91e3320dd81 (decode_coding): Clear chars_at_source flag when using charbuf.
Jason Rumney <jasonr@gnu.org>
parents: 100303
diff changeset
7170 coding->chars_at_source = 0;
d91e3320dd81 (decode_coding): Clear chars_at_source flag when using charbuf.
Jason Rumney <jasonr@gnu.org>
parents: 100303
diff changeset
7171
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7172 while (nbytes-- > 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7173 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7174 int c = *src++;
89279
1fd77c471ee6 (decode_coding_utf_8): When eol_type is Qdos, handle
Kenichi Handa <handa@m17n.org>
parents: 89227
diff changeset
7175
90243
c59afb15f5c6 (decode_coding): Fix handling of invalid bytes.
Kenichi Handa <handa@m17n.org>
parents: 90231
diff changeset
7176 if (c & 0x80)
c59afb15f5c6 (decode_coding): Fix handling of invalid bytes.
Kenichi Handa <handa@m17n.org>
parents: 90231
diff changeset
7177 c = BYTE8_TO_CHAR (c);
c59afb15f5c6 (decode_coding): Fix handling of invalid bytes.
Kenichi Handa <handa@m17n.org>
parents: 90231
diff changeset
7178 coding->charbuf[coding->charbuf_used++] = c;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7179 }
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
7180 produce_chars (coding, Qnil, 1);
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
7181 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7182 else
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7183 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7184 /* Record unprocessed bytes in coding->carryover. We are
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7185 sure that the number of data is less than the size of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7186 coding->carryover. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7187 unsigned char *p = coding->carryover;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7188
102115
db1f94e25359 (detect_coding): Don't overflow coding->carryover.
Kenichi Handa <handa@m17n.org>
parents: 102105
diff changeset
7189 if (nbytes > sizeof coding->carryover)
db1f94e25359 (detect_coding): Don't overflow coding->carryover.
Kenichi Handa <handa@m17n.org>
parents: 102105
diff changeset
7190 nbytes = sizeof coding->carryover;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7191 coding->carryover_bytes = nbytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7192 while (nbytes-- > 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7193 *p++ = *src++;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7194 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7195 coding->consumed = coding->src_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7196 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7197
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
7198 if (! EQ (CODING_ID_EOL_TYPE (coding->id), Qunix)
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
7199 && !inhibit_eol_conversion)
90378
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
7200 decode_eol (coding);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7201 if (BUFFERP (coding->dst_object))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7202 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7203 current_buffer->undo_list = undo_list;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7204 record_insert (coding->dst_pos, coding->produced_char);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7205 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
7206 return coding->result;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7207 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7208
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7209
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
7210 /* Extract an annotation datum from a composition starting at POS and
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7211 ending before LIMIT of CODING->src_object (buffer or string), store
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7212 the data in BUF, set *STOP to a starting position of the next
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7213 composition (if any) or to LIMIT, and return the address of the
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7214 next element of BUF.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7215
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7216 If such an annotation is not found, set *STOP to a starting
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7217 position of a composition after POS (if any) or to LIMIT, and
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7218 return BUF. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7219
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7220 static INLINE int *
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7221 handle_composition_annotation (EMACS_INT pos, EMACS_INT limit,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7222 struct coding_system *coding, int *buf,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7223 EMACS_INT *stop)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7224 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7225 EMACS_INT start, end;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7226 Lisp_Object prop;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7227
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7228 if (! find_composition (pos, limit, &start, &end, &prop, coding->src_object)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7229 || end > limit)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7230 *stop = limit;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7231 else if (start > pos)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7232 *stop = start;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7233 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7234 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7235 if (start == pos)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7236 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7237 /* We found a composition. Store the corresponding
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7238 annotation data in BUF. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7239 int *head = buf;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7240 enum composition_method method = COMPOSITION_METHOD (prop);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7241 int nchars = COMPOSITION_LENGTH (prop);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7242
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7243 ADD_COMPOSITION_DATA (buf, nchars, 0, method);
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7244 if (method != COMPOSITION_RELATIVE)
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7245 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7246 Lisp_Object components;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7247 int len, i, i_byte;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7248
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7249 components = COMPOSITION_COMPONENTS (prop);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7250 if (VECTORP (components))
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7251 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7252 len = XVECTOR (components)->size;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7253 for (i = 0; i < len; i++)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7254 *buf++ = XINT (AREF (components, i));
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7255 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7256 else if (STRINGP (components))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7257 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
7258 len = SCHARS (components);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7259 i = i_byte = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7260 while (i < len)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7261 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7262 FETCH_STRING_CHAR_ADVANCE (*buf, components, i, i_byte);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7263 buf++;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7264 }
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7265 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7266 else if (INTEGERP (components))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7267 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7268 len = 1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7269 *buf++ = XINT (components);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7270 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7271 else if (CONSP (components))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7272 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7273 for (len = 0; CONSP (components);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7274 len++, components = XCDR (components))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7275 *buf++ = XINT (XCAR (components));
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7276 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7277 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7278 abort ();
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7279 *head -= len;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7280 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7281 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7282
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7283 if (find_composition (end, limit, &start, &end, &prop,
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7284 coding->src_object)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7285 && end <= limit)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7286 *stop = start;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7287 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7288 *stop = limit;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7289 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7290 return buf;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7291 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7292
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7293
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
7294 /* Extract an annotation datum from a text property `charset' at POS of
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7295 CODING->src_object (buffer or string), store the data in BUF, set
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7296 *STOP to the position where the value of `charset' property changes
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7297 (limiting by LIMIT), and return the address of the next element of
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7298 BUF.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7299
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7300 If the property value is nil, set *STOP to the position where the
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7301 property value is non-nil (limiting by LIMIT), and return BUF. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7302
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7303 static INLINE int *
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7304 handle_charset_annotation (EMACS_INT pos, EMACS_INT limit,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7305 struct coding_system *coding, int *buf,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7306 EMACS_INT *stop)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7307 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7308 Lisp_Object val, next;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7309 int id;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7310
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7311 val = Fget_text_property (make_number (pos), Qcharset, coding->src_object);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7312 if (! NILP (val) && CHARSETP (val))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7313 id = XINT (CHARSET_SYMBOL_ID (val));
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7314 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7315 id = -1;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7316 ADD_CHARSET_DATA (buf, 0, id);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7317 next = Fnext_single_property_change (make_number (pos), Qcharset,
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7318 coding->src_object,
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7319 make_number (limit));
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7320 *stop = XINT (next);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7321 return buf;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7322 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7323
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7324
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7325 static void
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7326 consume_chars (struct coding_system *coding, Lisp_Object translation_table,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7327 int max_lookup)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7328 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7329 int *buf = coding->charbuf;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7330 int *buf_end = coding->charbuf + coding->charbuf_size;
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
7331 const unsigned char *src = coding->source + coding->consumed;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7332 const unsigned char *src_end = coding->source + coding->src_bytes;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7333 EMACS_INT pos = coding->src_pos + coding->consumed_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7334 EMACS_INT end_pos = coding->src_pos + coding->src_chars;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7335 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7336 Lisp_Object eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7337 int c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7338 EMACS_INT stop, stop_composition, stop_charset;
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
7339 int *lookup_buf = NULL;
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7340
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7341 if (! NILP (translation_table))
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
7342 lookup_buf = alloca (sizeof (int) * max_lookup);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7343
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
7344 eol_type = inhibit_eol_conversion ? Qunix : CODING_ID_EOL_TYPE (coding->id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7345 if (VECTORP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7346 eol_type = Qunix;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7347
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7348 /* Note: composition handling is not yet implemented. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7349 coding->common_flags &= ~CODING_ANNOTATE_COMPOSITION_MASK;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7350
89562
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7351 if (NILP (coding->src_object))
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7352 stop = stop_composition = stop_charset = end_pos;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7353 else
89562
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7354 {
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7355 if (coding->common_flags & CODING_ANNOTATE_COMPOSITION_MASK)
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7356 stop = stop_composition = pos;
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7357 else
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7358 stop = stop_composition = end_pos;
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7359 if (coding->common_flags & CODING_ANNOTATE_CHARSET_MASK)
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7360 stop = stop_charset = pos;
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7361 else
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7362 stop_charset = end_pos;
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7363 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7364
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7365 /* Compensate for CRLF and conversion. */
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7366 buf_end -= 1 + MAX_ANNOTATION_LENGTH;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7367 while (buf < buf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7368 {
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7369 Lisp_Object trans;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7370
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7371 if (pos == stop)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7372 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7373 if (pos == end_pos)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7374 break;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7375 if (pos == stop_composition)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7376 buf = handle_composition_annotation (pos, end_pos, coding,
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7377 buf, &stop_composition);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7378 if (pos == stop_charset)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7379 buf = handle_charset_annotation (pos, end_pos, coding,
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7380 buf, &stop_charset);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7381 stop = (stop_composition < stop_charset
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7382 ? stop_composition : stop_charset);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7383 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7384
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7385 if (! multibytep)
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7386 {
89462
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
7387 EMACS_INT bytes;
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
7388
106918
d6e8fa5622b7 Fix ccl encoding of unibyte source.
Kenichi Handa <handa@m17n.org>
parents: 106826
diff changeset
7389 if (coding->encoder == encode_coding_raw_text
d6e8fa5622b7 Fix ccl encoding of unibyte source.
Kenichi Handa <handa@m17n.org>
parents: 106826
diff changeset
7390 || coding->encoder == encode_coding_ccl)
89933
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
7391 c = *src++, pos++;
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
7392 else if ((bytes = MULTIBYTE_LENGTH (src, src_end)) > 0)
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
7393 c = STRING_CHAR_ADVANCE_NO_UNIFY (src), pos += bytes;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7394 else
89917
1763eef5ad02 (encode_coding_utf_8): Fix handling of raw-byte char.
Kenichi Handa <handa@m17n.org>
parents: 89905
diff changeset
7395 c = BYTE8_TO_CHAR (*src), src++, pos++;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7396 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7397 else
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
7398 c = STRING_CHAR_ADVANCE_NO_UNIFY (src), pos++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7399 if ((c == '\r') && (coding->mode & CODING_MODE_SELECTIVE_DISPLAY))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7400 c = '\n';
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7401 if (! EQ (eol_type, Qunix))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7402 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7403 if (c == '\n')
32443
57fa108c491f (code_convert_region): Be sure to initialize coding->category_idx.
Kenichi Handa <handa@m17n.org>
parents: 31458
diff changeset
7404 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7405 if (EQ (eol_type, Qdos))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7406 *buf++ = '\r';
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7407 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7408 c = '\r';
32443
57fa108c491f (code_convert_region): Be sure to initialize coding->category_idx.
Kenichi Handa <handa@m17n.org>
parents: 31458
diff changeset
7409 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7410 }
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7411
89858
23cb9ed79225 (get_translation_table): Declare it as Lisp_Object.
Kenichi Handa <handa@m17n.org>
parents: 89856
diff changeset
7412 trans = Qnil;
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
7413 LOOKUP_TRANSLATION_TABLE (translation_table, c, trans);
89858
23cb9ed79225 (get_translation_table): Declare it as Lisp_Object.
Kenichi Handa <handa@m17n.org>
parents: 89856
diff changeset
7414 if (NILP (trans))
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7415 *buf++ = c;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7416 else
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7417 {
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7418 int from_nchars = 1, to_nchars = 1;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7419 int *lookup_buf_end;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7420 const unsigned char *p = src;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7421 int i;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7422
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7423 lookup_buf[0] = c;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7424 for (i = 1; i < max_lookup && p < src_end; i++)
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7425 lookup_buf[i] = STRING_CHAR_ADVANCE (p);
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7426 lookup_buf_end = lookup_buf + i;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7427 trans = get_translation (trans, lookup_buf, lookup_buf_end);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7428 if (INTEGERP (trans))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7429 c = XINT (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7430 else if (CONSP (trans))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7431 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7432 from_nchars = ASIZE (XCAR (trans));
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7433 trans = XCDR (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7434 if (INTEGERP (trans))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7435 c = XINT (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7436 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7437 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7438 to_nchars = ASIZE (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7439 if (buf + to_nchars > buf_end)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7440 break;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7441 c = XINT (AREF (trans, 0));
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7442 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7443 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7444 else
23881
20d595402dea (DECODE_DESIGNATION): Jump to label_invalid_code if
Kenichi Handa <handa@m17n.org>
parents: 23564
diff changeset
7445 break;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7446 *buf++ = c;
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7447 for (i = 1; i < to_nchars; i++)
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7448 *buf++ = XINT (AREF (trans, i));
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7449 for (i = 1; i < from_nchars; i++, pos++)
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7450 src += MULTIBYTE_LENGTH_NO_CHECK (src);
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7451 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7452 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7453
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7454 coding->consumed = src - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7455 coding->consumed_char = pos - coding->src_pos;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7456 coding->charbuf_used = buf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7457 coding->chars_at_source = 0;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7458 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7459
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7460
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7461 /* Encode the text at CODING->src_object into CODING->dst_object.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7462 CODING->src_object is a buffer or a string.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7463 CODING->dst_object is a buffer or nil.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7464
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7465 If CODING->src_object is a buffer, it must be the current buffer.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7466 In this case, if CODING->src_pos is positive, it is a position of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7467 the source text in the buffer; otherwise, the source text is in the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7468 gap area of the buffer, and coding->src_pos specifies the offset of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7469 the text from GPT (which must be the same as PT). If this is the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7470 same buffer as CODING->dst_object, CODING->src_pos must be
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7471 negative and CODING should not have `pre-write-conversion'.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7472
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7473 If CODING->src_object is a string, CODING should not have
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7474 `pre-write-conversion'.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7475
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7476 If CODING->dst_object is a buffer, the encoded data is inserted at
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7477 the current point of that buffer.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7478
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7479 If CODING->dst_object is nil, the encoded data is placed at the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7480 memory area specified by CODING->destination. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7481
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7482 static int
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
7483 encode_coding (struct coding_system *coding)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7484 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7485 Lisp_Object attrs;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
7486 Lisp_Object translation_table;
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
7487 int max_lookup;
107507
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
7488 struct ccl_spec cclspec;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7489
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7490 attrs = CODING_ID_ATTRS (coding->id);
89933
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
7491 if (coding->encoder == encode_coding_raw_text)
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
7492 translation_table = Qnil, max_lookup = 0;
42661
e85e4d9494b1 (code_convert_region): Don't copy old text if undo disabled.
Richard M. Stallman <rms@gnu.org>
parents: 42105
diff changeset
7493 else
89933
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
7494 translation_table = get_translation_table (attrs, 1, &max_lookup);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7495
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7496 if (BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7497 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7498 set_buffer_internal (XBUFFER (coding->dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7499 coding->dst_multibyte
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7500 = ! NILP (current_buffer->enable_multibyte_characters);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7501 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7502
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7503 coding->consumed = coding->consumed_char = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7504 coding->produced = coding->produced_char = 0;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7505 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7506 coding->errors = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7507
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7508 ALLOC_CONVERSION_WORK_AREA (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7509
107507
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
7510 if (coding->encoder == encode_coding_ccl)
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
7511 {
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
7512 coding->spec.ccl = &cclspec;
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
7513 setup_ccl_program (&cclspec.ccl, CODING_CCL_ENCODER (coding));
8960853cf85d Fix the ccl encoder for the case that the output buffer is fullfilled.
Kenichi Handa <handa@m17n.org>
parents: 107506
diff changeset
7514 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7515 do {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7516 coding_set_source (coding);
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
7517 consume_chars (coding, translation_table, max_lookup);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7518 coding_set_destination (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7519 (*(coding->encoder)) (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7520 } while (coding->consumed_char < coding->src_chars);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7521
90809
3c52757d5f6e (produce_chars): Don't call insert_from_gap if no
Kenichi Handa <handa@m17n.org>
parents: 90772
diff changeset
7522 if (BUFFERP (coding->dst_object) && coding->produced_char > 0)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7523 insert_from_gap (coding->produced_char, coding->produced);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7524
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7525 return (coding->result);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7526 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7527
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7528
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7529 /* Name (or base name) of work buffer for code conversion. */
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7530 static Lisp_Object Vcode_conversion_workbuf_name;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7531
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7532 /* A working buffer used by the top level conversion. Once it is
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7533 created, it is never destroyed. It has the name
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7534 Vcode_conversion_workbuf_name. The other working buffers are
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7535 destroyed after the use is finished, and their names are modified
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7536 versions of Vcode_conversion_workbuf_name. */
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7537 static Lisp_Object Vcode_conversion_reused_workbuf;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7538
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7539 /* Nonzero iff Vcode_conversion_reused_workbuf is already in use. */
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7540 static int reused_workbuf_in_use;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7541
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7542
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
7543 /* Return a working buffer for code conversion. MULTIBYTE specifies the
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7544 multibyteness of the returned buffer. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7545
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
7546 static Lisp_Object
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
7547 make_conversion_work_buffer (int multibyte)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7548 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7549 Lisp_Object name, workbuf;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7550 struct buffer *current;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7551
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7552 if (reused_workbuf_in_use++)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7553 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7554 name = Fgenerate_new_buffer_name (Vcode_conversion_workbuf_name, Qnil);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7555 workbuf = Fget_buffer_create (name);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7556 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7557 else
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7558 {
99074
10cd979d05ca (make_conversion_work_buffer): Check that Vcode_conversion_reused_workbuf
Noah Friedman <friedman@splode.com>
parents: 98992
diff changeset
7559 if (NILP (Fbuffer_live_p (Vcode_conversion_reused_workbuf)))
98186
1cfa973fde14 (make_conversion_work_buffer): Avoid calling
Kenichi Handa <handa@m17n.org>
parents: 96571
diff changeset
7560 Vcode_conversion_reused_workbuf
1cfa973fde14 (make_conversion_work_buffer): Avoid calling
Kenichi Handa <handa@m17n.org>
parents: 96571
diff changeset
7561 = Fget_buffer_create (Vcode_conversion_workbuf_name);
1cfa973fde14 (make_conversion_work_buffer): Avoid calling
Kenichi Handa <handa@m17n.org>
parents: 96571
diff changeset
7562 workbuf = Vcode_conversion_reused_workbuf;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7563 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7564 current = current_buffer;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7565 set_buffer_internal (XBUFFER (workbuf));
100262
46114a72fb0e (make_conversion_work_buffer): Disable buffer modification hooks in
Chong Yidong <cyd@stupidchicken.com>
parents: 100176
diff changeset
7566 /* We can't allow modification hooks to run in the work buffer. For
46114a72fb0e (make_conversion_work_buffer): Disable buffer modification hooks in
Chong Yidong <cyd@stupidchicken.com>
parents: 100176
diff changeset
7567 instance, directory_files_internal assumes that file decoding
46114a72fb0e (make_conversion_work_buffer): Disable buffer modification hooks in
Chong Yidong <cyd@stupidchicken.com>
parents: 100176
diff changeset
7568 doesn't compile new regexps. */
46114a72fb0e (make_conversion_work_buffer): Disable buffer modification hooks in
Chong Yidong <cyd@stupidchicken.com>
parents: 100176
diff changeset
7569 Fset (Fmake_local_variable (Qinhibit_modification_hooks), Qt);
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
7570 Ferase_buffer ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7571 current_buffer->undo_list = Qt;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7572 current_buffer->enable_multibyte_characters = multibyte ? Qt : Qnil;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7573 set_buffer_internal (current);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7574 return workbuf;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7575 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7576
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7577
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7578 static Lisp_Object
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
7579 code_conversion_restore (Lisp_Object arg)
26067
f54ca66e2571 (code_convert_string): Add record_unwind_protect to
Kenichi Handa <handa@m17n.org>
parents: 25860
diff changeset
7580 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7581 Lisp_Object current, workbuf;
90263
80fb4c061e99 (code_conversion_restore): GCPRO arg.
Kenichi Handa <handa@m17n.org>
parents: 90261
diff changeset
7582 struct gcpro gcpro1;
80fb4c061e99 (code_conversion_restore): GCPRO arg.
Kenichi Handa <handa@m17n.org>
parents: 90261
diff changeset
7583
80fb4c061e99 (code_conversion_restore): GCPRO arg.
Kenichi Handa <handa@m17n.org>
parents: 90261
diff changeset
7584 GCPRO1 (arg);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7585 current = XCAR (arg);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7586 workbuf = XCDR (arg);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7587 if (! NILP (workbuf))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7588 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7589 if (EQ (workbuf, Vcode_conversion_reused_workbuf))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7590 reused_workbuf_in_use = 0;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7591 else if (! NILP (Fbuffer_live_p (workbuf)))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7592 Fkill_buffer (workbuf);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7593 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7594 set_buffer_internal (XBUFFER (current));
90263
80fb4c061e99 (code_conversion_restore): GCPRO arg.
Kenichi Handa <handa@m17n.org>
parents: 90261
diff changeset
7595 UNGCPRO;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7596 return Qnil;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7597 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7598
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7599 Lisp_Object
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
7600 code_conversion_save (int with_work_buf, int multibyte)
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7601 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7602 Lisp_Object workbuf = Qnil;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7603
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7604 if (with_work_buf)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7605 workbuf = make_conversion_work_buffer (multibyte);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7606 record_unwind_protect (code_conversion_restore,
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7607 Fcons (Fcurrent_buffer (), workbuf));
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7608 return workbuf;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7609 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7610
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7611 int
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7612 decode_coding_gap (struct coding_system *coding,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7613 EMACS_INT chars, EMACS_INT bytes)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7614 {
109158
6175ebc3b6ce * coding.c: Use SPECPDL_INDEX, DOS_NT.
Juanma Barranquero <lekktu@gmail.com>
parents: 109126
diff changeset
7615 int count = SPECPDL_INDEX ();
89448
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7616 Lisp_Object attrs;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7617
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7618 code_conversion_save (0, 0);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7619
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7620 coding->src_object = Fcurrent_buffer ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7621 coding->src_chars = chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7622 coding->src_bytes = bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7623 coding->src_pos = -chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7624 coding->src_pos_byte = -bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7625 coding->src_multibyte = chars < bytes;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7626 coding->dst_object = coding->src_object;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7627 coding->dst_pos = PT;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7628 coding->dst_pos_byte = PT_BYTE;
88443
6b86cf30a0b9 (produce_chars): Set the variable `multibytep' correctly.
Kenichi Handa <handa@m17n.org>
parents: 88438
diff changeset
7629 coding->dst_multibyte = ! NILP (current_buffer->enable_multibyte_characters);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7630
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7631 if (CODING_REQUIRE_DETECTION (coding))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7632 detect_coding (coding);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
7633
90350
60eaefb08cf7 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90346
diff changeset
7634 coding->mode |= CODING_MODE_LAST_BLOCK;
90772
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
7635 current_buffer->text->inhibit_shrinking = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7636 decode_coding (coding);
90772
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
7637 current_buffer->text->inhibit_shrinking = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7638
89448
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7639 attrs = CODING_ID_ATTRS (coding->id);
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7640 if (! NILP (CODING_ATTR_POST_READ (attrs)))
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7641 {
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7642 EMACS_INT prev_Z = Z, prev_Z_BYTE = Z_BYTE;
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7643 Lisp_Object val;
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7644
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7645 TEMP_SET_PT_BOTH (coding->dst_pos, coding->dst_pos_byte);
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7646 val = call1 (CODING_ATTR_POST_READ (attrs),
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7647 make_number (coding->produced_char));
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7648 CHECK_NATNUM (val);
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7649 coding->produced_char += Z - prev_Z;
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7650 coding->produced += Z_BYTE - prev_Z_BYTE;
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7651 }
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7652
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7653 unbind_to (count, Qnil);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
7654 return coding->result;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7655 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7656
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7657 int
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7658 encode_coding_gap (struct coding_system *coding,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7659 EMACS_INT chars, EMACS_INT bytes)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7660 {
109158
6175ebc3b6ce * coding.c: Use SPECPDL_INDEX, DOS_NT.
Juanma Barranquero <lekktu@gmail.com>
parents: 109126
diff changeset
7661 int count = SPECPDL_INDEX ();
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7662
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7663 code_conversion_save (0, 0);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7664
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7665 coding->src_object = Fcurrent_buffer ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7666 coding->src_chars = chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7667 coding->src_bytes = bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7668 coding->src_pos = -chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7669 coding->src_pos_byte = -bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7670 coding->src_multibyte = chars < bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7671 coding->dst_object = coding->src_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7672 coding->dst_pos = PT;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7673 coding->dst_pos_byte = PT_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7674
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7675 encode_coding (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7676
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7677 unbind_to (count, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7678 return coding->result;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7679 }
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7680
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7681
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7682 /* Decode the text in the range FROM/FROM_BYTE and TO/TO_BYTE in
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7683 SRC_OBJECT into DST_OBJECT by coding context CODING.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7684
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7685 SRC_OBJECT is a buffer, a string, or Qnil.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7686
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7687 If it is a buffer, the text is at point of the buffer. FROM and TO
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7688 are positions in the buffer.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7689
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7690 If it is a string, the text is at the beginning of the string.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7691 FROM and TO are indices to the string.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7692
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7693 If it is nil, the text is at coding->source. FROM and TO are
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7694 indices to coding->source.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7695
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7696 DST_OBJECT is a buffer, Qt, or Qnil.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7697
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7698 If it is a buffer, the decoded text is inserted at point of the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7699 buffer. If the buffer is the same as SRC_OBJECT, the source text
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7700 is deleted.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7701
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7702 If it is Qt, a string is made from the decoded text, and
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7703 set in CODING->dst_object.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7704
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7705 If it is Qnil, the decoded text is stored at CODING->destination.
89418
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
7706 The caller must allocate CODING->dst_bytes bytes at
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7707 CODING->destination by xmalloc. If the decoded text is longer than
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7708 CODING->dst_bytes, CODING->destination is relocated by xrealloc.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7709 */
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7710
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7711 void
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7712 decode_coding_object (struct coding_system *coding,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7713 Lisp_Object src_object,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7714 EMACS_INT from, EMACS_INT from_byte,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7715 EMACS_INT to, EMACS_INT to_byte,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7716 Lisp_Object dst_object)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7717 {
109158
6175ebc3b6ce * coding.c: Use SPECPDL_INDEX, DOS_NT.
Juanma Barranquero <lekktu@gmail.com>
parents: 109126
diff changeset
7718 int count = SPECPDL_INDEX ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7719 unsigned char *destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7720 EMACS_INT dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7721 EMACS_INT chars = to - from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7722 EMACS_INT bytes = to_byte - from_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7723 Lisp_Object attrs;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7724 int saved_pt = -1, saved_pt_byte;
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7725 int need_marker_adjustment = 0;
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7726 Lisp_Object old_deactivate_mark;
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7727
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7728 old_deactivate_mark = Vdeactivate_mark;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7729
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7730 if (NILP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7731 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7732 destination = coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7733 dst_bytes = coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7734 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7735
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7736 coding->src_object = src_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7737 coding->src_chars = chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7738 coding->src_bytes = bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7739 coding->src_multibyte = chars < bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7740
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7741 if (STRINGP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7742 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7743 coding->src_pos = from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7744 coding->src_pos_byte = from_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7745 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7746 else if (BUFFERP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7747 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7748 set_buffer_internal (XBUFFER (src_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7749 if (from != GPT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7750 move_gap_both (from, from_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7751 if (EQ (src_object, dst_object))
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7752 {
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7753 struct Lisp_Marker *tail;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7754
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7755 for (tail = BUF_MARKERS (current_buffer); tail; tail = tail->next)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7756 {
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7757 tail->need_adjustment
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7758 = tail->charpos == (tail->insertion_type ? from : to);
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7759 need_marker_adjustment |= tail->need_adjustment;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7760 }
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7761 saved_pt = PT, saved_pt_byte = PT_BYTE;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7762 TEMP_SET_PT_BOTH (from, from_byte);
92458
5f5f07a5c076 (decode_coding_object): Inhibit gap shrinking while
Andreas Schwab <schwab@suse.de>
parents: 92406
diff changeset
7763 current_buffer->text->inhibit_shrinking = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7764 del_range_both (from, from_byte, to, to_byte, 1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7765 coding->src_pos = -chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7766 coding->src_pos_byte = -bytes;
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
7767 }
42661
e85e4d9494b1 (code_convert_region): Don't copy old text if undo disabled.
Richard M. Stallman <rms@gnu.org>
parents: 42105
diff changeset
7768 else
e85e4d9494b1 (code_convert_region): Don't copy old text if undo disabled.
Richard M. Stallman <rms@gnu.org>
parents: 42105
diff changeset
7769 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7770 coding->src_pos = from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7771 coding->src_pos_byte = from_byte;
29985
c17e78d8c720 (code_convert_region): Even if the length of text is
Kenichi Handa <handa@m17n.org>
parents: 29932
diff changeset
7772 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7773 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7774
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7775 if (CODING_REQUIRE_DETECTION (coding))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7776 detect_coding (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7777 attrs = CODING_ID_ATTRS (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7778
89418
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
7779 if (EQ (dst_object, Qt)
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
7780 || (! NILP (CODING_ATTR_POST_READ (attrs))
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
7781 && NILP (dst_object)))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7782 {
93321
c3fe9ef79b56 (decode_coding_object): Fix last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93197
diff changeset
7783 coding->dst_multibyte = !CODING_FOR_UNIBYTE (coding);
c3fe9ef79b56 (decode_coding_object): Fix last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93197
diff changeset
7784 coding->dst_object = code_conversion_save (1, coding->dst_multibyte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7785 coding->dst_pos = BEG;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7786 coding->dst_pos_byte = BEG_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7787 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7788 else if (BUFFERP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7789 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7790 code_conversion_save (0, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7791 coding->dst_object = dst_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7792 coding->dst_pos = BUF_PT (XBUFFER (dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7793 coding->dst_pos_byte = BUF_PT_BYTE (XBUFFER (dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7794 coding->dst_multibyte
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7795 = ! NILP (XBUFFER (dst_object)->enable_multibyte_characters);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7796 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
7797 else
29172
46ad5a027334 (run_pre_post_conversion_on_str): Set point to the
Kenichi Handa <handa@m17n.org>
parents: 29093
diff changeset
7798 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7799 code_conversion_save (0, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7800 coding->dst_object = Qnil;
93322
3b82aab9d8fc (decode_coding_object): Revert part of last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93321
diff changeset
7801 /* Most callers presume this will return a multibyte result, and they
3b82aab9d8fc (decode_coding_object): Revert part of last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93321
diff changeset
7802 won't use `binary' or `raw-text' anyway, so let's not worry about
3b82aab9d8fc (decode_coding_object): Revert part of last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93321
diff changeset
7803 CODING_FOR_UNIBYTE. */
93323
06e93ffa2e9f (decode_coding_object): Fix last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93322
diff changeset
7804 coding->dst_multibyte = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7805 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7806
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7807 decode_coding (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7808
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7809 if (BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7810 set_buffer_internal (XBUFFER (coding->dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7811
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7812 if (! NILP (CODING_ATTR_POST_READ (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7813 {
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7814 struct gcpro gcpro1, gcpro2, gcpro3, gcpro4, gcpro5;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7815 EMACS_INT prev_Z = Z, prev_Z_BYTE = Z_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7816 Lisp_Object val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7817
88506
a7f0d13affa5 (decode_coding_object): Move point to coding->dst_pos before
Kenichi Handa <handa@m17n.org>
parents: 88497
diff changeset
7818 TEMP_SET_PT_BOTH (coding->dst_pos, coding->dst_pos_byte);
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7819 GCPRO5 (coding->src_object, coding->dst_object, src_object, dst_object,
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7820 old_deactivate_mark);
90131
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7821 val = safe_call1 (CODING_ATTR_POST_READ (attrs),
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7822 make_number (coding->produced_char));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7823 UNGCPRO;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7824 CHECK_NATNUM (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7825 coding->produced_char += Z - prev_Z;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7826 coding->produced += Z_BYTE - prev_Z_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7827 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7828
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7829 if (EQ (dst_object, Qt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7830 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7831 coding->dst_object = Fbuffer_string ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7832 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7833 else if (NILP (dst_object) && BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7834 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7835 set_buffer_internal (XBUFFER (coding->dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7836 if (dst_bytes < coding->produced)
42105
09cc243e2d14 (code_convert_region): Update coding->cmp_data->char_offset
Richard M. Stallman <rms@gnu.org>
parents: 42104
diff changeset
7837 {
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7838 destination = xrealloc (destination, coding->produced);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7839 if (! destination)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7840 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7841 record_conversion_result (coding,
107174
e98bd64897e0 Fix handling of CODING_RESULT_INSUFFICIENT_DST.
Kenichi Handa <handa@m17n.org>
parents: 107171
diff changeset
7842 CODING_RESULT_INSUFFICIENT_MEM);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7843 unbind_to (count, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7844 return;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7845 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7846 if (BEGV < GPT && GPT < BEGV + coding->produced_char)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7847 move_gap_both (BEGV, BEGV_BYTE);
109165
750db9f3e6d8 Replace bcopy, bzero, bcmp by memcpy, memmove, memset, memcmp
Andreas Schwab <schwab@linux-m68k.org>
parents: 109159
diff changeset
7848 memcpy (destination, BEGV_ADDR, coding->produced);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7849 coding->destination = destination;
23279
ca159e828a68 (ccl_coding_driver): If ccl_driver is interrupted by a
Kenichi Handa <handa@m17n.org>
parents: 23258
diff changeset
7850 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7851 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7852
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7853 if (saved_pt >= 0)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7854 {
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7855 /* This is the case of:
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7856 (BUFFERP (src_object) && EQ (src_object, dst_object))
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7857 As we have moved PT while replacing the original buffer
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7858 contents, we must recover it now. */
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7859 set_buffer_internal (XBUFFER (src_object));
92458
5f5f07a5c076 (decode_coding_object): Inhibit gap shrinking while
Andreas Schwab <schwab@suse.de>
parents: 92406
diff changeset
7860 current_buffer->text->inhibit_shrinking = 0;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7861 if (saved_pt < from)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7862 TEMP_SET_PT_BOTH (saved_pt, saved_pt_byte);
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7863 else if (saved_pt < from + chars)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7864 TEMP_SET_PT_BOTH (from, from_byte);
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7865 else if (! NILP (current_buffer->enable_multibyte_characters))
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7866 TEMP_SET_PT_BOTH (saved_pt + (coding->produced_char - chars),
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7867 saved_pt_byte + (coding->produced - bytes));
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7868 else
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7869 TEMP_SET_PT_BOTH (saved_pt + (coding->produced - bytes),
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7870 saved_pt_byte + (coding->produced - bytes));
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7871
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7872 if (need_marker_adjustment)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7873 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7874 struct Lisp_Marker *tail;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7875
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7876 for (tail = BUF_MARKERS (current_buffer); tail; tail = tail->next)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7877 if (tail->need_adjustment)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7878 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7879 tail->need_adjustment = 0;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7880 if (tail->insertion_type)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7881 {
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7882 tail->bytepos = from_byte;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7883 tail->charpos = from;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7884 }
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7885 else
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7886 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7887 tail->bytepos = from_byte + coding->produced;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7888 tail->charpos
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7889 = (NILP (current_buffer->enable_multibyte_characters)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7890 ? tail->bytepos : from + coding->produced_char);
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7891 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7892 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7893 }
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7894 }
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7895
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7896 Vdeactivate_mark = old_deactivate_mark;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7897 unbind_to (count, coding->dst_object);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7898 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7899
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7900
29275
b4ea9178e480 (DECODE_COMPOSITION_START): If coding->cmp_data is not
Kenichi Handa <handa@m17n.org>
parents: 29247
diff changeset
7901 void
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7902 encode_coding_object (struct coding_system *coding,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7903 Lisp_Object src_object,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7904 EMACS_INT from, EMACS_INT from_byte,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7905 EMACS_INT to, EMACS_INT to_byte,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
7906 Lisp_Object dst_object)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7907 {
109158
6175ebc3b6ce * coding.c: Use SPECPDL_INDEX, DOS_NT.
Juanma Barranquero <lekktu@gmail.com>
parents: 109126
diff changeset
7908 int count = SPECPDL_INDEX ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7909 EMACS_INT chars = to - from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7910 EMACS_INT bytes = to_byte - from_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7911 Lisp_Object attrs;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7912 int saved_pt = -1, saved_pt_byte;
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7913 int need_marker_adjustment = 0;
90231
8be9e4c6d687 (encode_coding_object): If a pre-write-conversion
Kenichi Handa <handa@m17n.org>
parents: 90224
diff changeset
7914 int kill_src_buffer = 0;
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7915 Lisp_Object old_deactivate_mark;
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7916
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7917 old_deactivate_mark = Vdeactivate_mark;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7918
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7919 coding->src_object = src_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7920 coding->src_chars = chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7921 coding->src_bytes = bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7922 coding->src_multibyte = chars < bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7923
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7924 attrs = CODING_ID_ATTRS (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7925
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7926 if (EQ (src_object, dst_object))
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7927 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7928 struct Lisp_Marker *tail;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7929
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7930 for (tail = BUF_MARKERS (current_buffer); tail; tail = tail->next)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7931 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7932 tail->need_adjustment
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7933 = tail->charpos == (tail->insertion_type ? from : to);
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7934 need_marker_adjustment |= tail->need_adjustment;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7935 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7936 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7937
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7938 if (! NILP (CODING_ATTR_PRE_WRITE (attrs)))
21062
839b22ad1e42 (code_convert_region): Handle the case that codes
Kenichi Handa <handa@m17n.org>
parents: 20999
diff changeset
7939 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7940 coding->src_object = code_conversion_save (1, coding->src_multibyte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7941 set_buffer_internal (XBUFFER (coding->src_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7942 if (STRINGP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7943 insert_from_string (src_object, from, from_byte, chars, bytes, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7944 else if (BUFFERP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7945 insert_from_buffer (XBUFFER (src_object), from, chars, 0);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7946 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7947 insert_1_both (coding->source + from, chars, bytes, 0, 0, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7948
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7949 if (EQ (src_object, dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7950 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7951 set_buffer_internal (XBUFFER (src_object));
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7952 saved_pt = PT, saved_pt_byte = PT_BYTE;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7953 del_range_both (from, from_byte, to, to_byte, 1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7954 set_buffer_internal (XBUFFER (coding->src_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7955 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7956
90131
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7957 {
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7958 Lisp_Object args[3];
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7959 struct gcpro gcpro1, gcpro2, gcpro3, gcpro4, gcpro5;
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7960
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7961 GCPRO5 (coding->src_object, coding->dst_object, src_object, dst_object,
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7962 old_deactivate_mark);
90131
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7963 args[0] = CODING_ATTR_PRE_WRITE (attrs);
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7964 args[1] = make_number (BEG);
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7965 args[2] = make_number (Z);
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7966 safe_call (3, args);
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7967 UNGCPRO;
90131
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7968 }
90231
8be9e4c6d687 (encode_coding_object): If a pre-write-conversion
Kenichi Handa <handa@m17n.org>
parents: 90224
diff changeset
7969 if (XBUFFER (coding->src_object) != current_buffer)
8be9e4c6d687 (encode_coding_object): If a pre-write-conversion
Kenichi Handa <handa@m17n.org>
parents: 90224
diff changeset
7970 kill_src_buffer = 1;
88510
d266b8fb8761 (encode_coding_object): Give correct arguments ot
Kenichi Handa <handa@m17n.org>
parents: 88506
diff changeset
7971 coding->src_object = Fcurrent_buffer ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7972 if (BEG != GPT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7973 move_gap_both (BEG, BEG_BYTE);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7974 coding->src_chars = Z - BEG;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7975 coding->src_bytes = Z_BYTE - BEG_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7976 coding->src_pos = BEG;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7977 coding->src_pos_byte = BEG_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7978 coding->src_multibyte = Z < Z_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7979 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7980 else if (STRINGP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7981 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7982 code_conversion_save (0, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7983 coding->src_pos = from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7984 coding->src_pos_byte = from_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7985 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7986 else if (BUFFERP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7987 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7988 code_conversion_save (0, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7989 set_buffer_internal (XBUFFER (src_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7990 if (EQ (src_object, dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7991 {
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7992 saved_pt = PT, saved_pt_byte = PT_BYTE;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7993 coding->src_object = del_range_1 (from, to, 1, 1);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7994 coding->src_pos = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7995 coding->src_pos_byte = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7996 }
23514
7bad909cd6f1 (setup_coding_system): Fix setting up
Kenichi Handa <handa@m17n.org>
parents: 23475
diff changeset
7997 else
42105
09cc243e2d14 (code_convert_region): Update coding->cmp_data->char_offset
Richard M. Stallman <rms@gnu.org>
parents: 42104
diff changeset
7998 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7999 if (from < GPT && to >= GPT)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8000 move_gap_both (from, from_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8001 coding->src_pos = from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8002 coding->src_pos_byte = from_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8003 }
64308
93129de4b8a4 (code_convert_region_unwind): ARG is changed to a cons.
Kenichi Handa <handa@m17n.org>
parents: 64251
diff changeset
8004 }
93129de4b8a4 (code_convert_region_unwind): ARG is changed to a cons.
Kenichi Handa <handa@m17n.org>
parents: 64251
diff changeset
8005 else
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8006 code_conversion_save (0, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8007
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8008 if (BUFFERP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8009 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8010 coding->dst_object = dst_object;
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
8011 if (EQ (src_object, dst_object))
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
8012 {
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
8013 coding->dst_pos = from;
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
8014 coding->dst_pos_byte = from_byte;
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
8015 }
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
8016 else
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
8017 {
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8018 struct buffer *current = current_buffer;
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8019
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8020 set_buffer_temp (XBUFFER (dst_object));
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8021 coding->dst_pos = PT;
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8022 coding->dst_pos_byte = PT_BYTE;
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8023 move_gap_both (coding->dst_pos, coding->dst_pos_byte);
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8024 set_buffer_temp (current);
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
8025 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8026 coding->dst_multibyte
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8027 = ! NILP (XBUFFER (dst_object)->enable_multibyte_characters);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8028 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8029 else if (EQ (dst_object, Qt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8030 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8031 coding->dst_object = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8032 coding->dst_bytes = coding->src_chars;
88510
d266b8fb8761 (encode_coding_object): Give correct arguments ot
Kenichi Handa <handa@m17n.org>
parents: 88506
diff changeset
8033 if (coding->dst_bytes == 0)
d266b8fb8761 (encode_coding_object): Give correct arguments ot
Kenichi Handa <handa@m17n.org>
parents: 88506
diff changeset
8034 coding->dst_bytes = 1;
d266b8fb8761 (encode_coding_object): Give correct arguments ot
Kenichi Handa <handa@m17n.org>
parents: 88506
diff changeset
8035 coding->destination = (unsigned char *) xmalloc (coding->dst_bytes);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8036 coding->dst_multibyte = 0;
65506
f376635f5061 (code_convert_region_unwind): Argument format changed.
Kenichi Handa <handa@m17n.org>
parents: 64770
diff changeset
8037 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
8038 else
29172
46ad5a027334 (run_pre_post_conversion_on_str): Set point to the
Kenichi Handa <handa@m17n.org>
parents: 29093
diff changeset
8039 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8040 coding->dst_object = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8041 coding->dst_multibyte = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8042 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8043
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8044 encode_coding (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8045
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8046 if (EQ (dst_object, Qt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8047 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8048 if (BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8049 coding->dst_object = Fbuffer_string ();
23514
7bad909cd6f1 (setup_coding_system): Fix setting up
Kenichi Handa <handa@m17n.org>
parents: 23475
diff changeset
8050 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8051 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8052 coding->dst_object
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8053 = make_unibyte_string ((char *) coding->destination,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8054 coding->produced);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8055 xfree (coding->destination);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8056 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8057 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8058
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8059 if (saved_pt >= 0)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8060 {
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8061 /* This is the case of:
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8062 (BUFFERP (src_object) && EQ (src_object, dst_object))
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8063 As we have moved PT while replacing the original buffer
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8064 contents, we must recover it now. */
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8065 set_buffer_internal (XBUFFER (src_object));
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8066 if (saved_pt < from)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8067 TEMP_SET_PT_BOTH (saved_pt, saved_pt_byte);
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8068 else if (saved_pt < from + chars)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8069 TEMP_SET_PT_BOTH (from, from_byte);
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8070 else if (! NILP (current_buffer->enable_multibyte_characters))
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8071 TEMP_SET_PT_BOTH (saved_pt + (coding->produced_char - chars),
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8072 saved_pt_byte + (coding->produced - bytes));
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8073 else
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8074 TEMP_SET_PT_BOTH (saved_pt + (coding->produced - bytes),
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8075 saved_pt_byte + (coding->produced - bytes));
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8076
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8077 if (need_marker_adjustment)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8078 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8079 struct Lisp_Marker *tail;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8080
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8081 for (tail = BUF_MARKERS (current_buffer); tail; tail = tail->next)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8082 if (tail->need_adjustment)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8083 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8084 tail->need_adjustment = 0;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8085 if (tail->insertion_type)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8086 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8087 tail->bytepos = from_byte;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8088 tail->charpos = from;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8089 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8090 else
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8091 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8092 tail->bytepos = from_byte + coding->produced;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8093 tail->charpos
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8094 = (NILP (current_buffer->enable_multibyte_characters)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8095 ? tail->bytepos : from + coding->produced_char);
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8096 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8097 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8098 }
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8099 }
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8100
90231
8be9e4c6d687 (encode_coding_object): If a pre-write-conversion
Kenichi Handa <handa@m17n.org>
parents: 90224
diff changeset
8101 if (kill_src_buffer)
8be9e4c6d687 (encode_coding_object): If a pre-write-conversion
Kenichi Handa <handa@m17n.org>
parents: 90224
diff changeset
8102 Fkill_buffer (coding->src_object);
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
8103
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
8104 Vdeactivate_mark = old_deactivate_mark;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8105 unbind_to (count, Qnil);
58637
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
8106 }
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
8107
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
8108
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
8109 Lisp_Object
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
8110 preferred_coding_system (void)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8111 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8112 int id = coding_categories[coding_priorities[0]].id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8113
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8114 return CODING_ID_NAME (id);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8115 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8116
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8117
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8118 #ifdef emacs
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
8119 /*** 8. Emacs Lisp library functions ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8120
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8121 DEFUN ("coding-system-p", Fcoding_system_p, Scoding_system_p, 1, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8122 doc: /* Return t if OBJECT is nil or a coding-system.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8123 See the documentation of `define-coding-system' for information
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8124 about coding-system objects. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
8125 (Lisp_Object object)
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8126 {
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8127 if (NILP (object)
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8128 || CODING_SYSTEM_ID (object) >= 0)
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
8129 return Qt;
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8130 if (! SYMBOLP (object)
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8131 || NILP (Fget (object, Qcoding_system_define_form)))
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
8132 return Qnil;
90272
f1df126ec7de Sync to HEAD for handling autoload-coding-system.
Kenichi Handa <handa@m17n.org>
parents: 90263
diff changeset
8133 return Qt;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8134 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8135
17717
4891aaecc5cc (Fread_coding_system, Fread_non_nil_coding_system):
Richard M. Stallman <rms@gnu.org>
parents: 17485
diff changeset
8136 DEFUN ("read-non-nil-coding-system", Fread_non_nil_coding_system,
4891aaecc5cc (Fread_coding_system, Fread_non_nil_coding_system):
Richard M. Stallman <rms@gnu.org>
parents: 17485
diff changeset
8137 Sread_non_nil_coding_system, 1, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8138 doc: /* Read a coding system from the minibuffer, prompting with string PROMPT. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
8139 (Lisp_Object prompt)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8140 {
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
8141 Lisp_Object val;
17717
4891aaecc5cc (Fread_coding_system, Fread_non_nil_coding_system):
Richard M. Stallman <rms@gnu.org>
parents: 17485
diff changeset
8142 do
4891aaecc5cc (Fread_coding_system, Fread_non_nil_coding_system):
Richard M. Stallman <rms@gnu.org>
parents: 17485
diff changeset
8143 {
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
8144 val = Fcompleting_read (prompt, Vcoding_system_alist, Qnil,
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
8145 Qt, Qnil, Qcoding_system_history, Qnil, Qnil);
17717
4891aaecc5cc (Fread_coding_system, Fread_non_nil_coding_system):
Richard M. Stallman <rms@gnu.org>
parents: 17485
diff changeset
8146 }
46370
40db0673e6f0 Most uses of XSTRING combined with STRING_BYTES or indirection changed to
Ken Raeburn <raeburn@raeburn.org>
parents: 46293
diff changeset
8147 while (SCHARS (val) == 0);
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
8148 return (Fintern (val, Qnil));
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8149 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8150
19758
49a1662b68dd (Fread_coding_system): New optional arg DEFAULT_CODING_SYSTEM.
Richard M. Stallman <rms@gnu.org>
parents: 19750
diff changeset
8151 DEFUN ("read-coding-system", Fread_coding_system, Sread_coding_system, 1, 2, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8152 doc: /* Read a coding system from the minibuffer, prompting with string PROMPT.
79107
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
8153 If the user enters null input, return second argument DEFAULT-CODING-SYSTEM.
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
8154 Ignores case when completing coding systems (all Emacs coding systems
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
8155 are lower-case). */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
8156 (Lisp_Object prompt, Lisp_Object default_coding_system)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8157 {
19747
bed06df9cbc5 (setup_coding_system, Ffind_operation_coding_system)
Richard M. Stallman <rms@gnu.org>
parents: 19743
diff changeset
8158 Lisp_Object val;
79107
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
8159 int count = SPECPDL_INDEX ();
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
8160
19758
49a1662b68dd (Fread_coding_system): New optional arg DEFAULT_CODING_SYSTEM.
Richard M. Stallman <rms@gnu.org>
parents: 19750
diff changeset
8161 if (SYMBOLP (default_coding_system))
45396
cab845213388 * coding.c (Fread_coding_system, code_convert_region1)
Ken Raeburn <raeburn@raeburn.org>
parents: 45239
diff changeset
8162 default_coding_system = SYMBOL_NAME (default_coding_system);
79107
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
8163 specbind (Qcompletion_ignore_case, Qt);
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
8164 val = Fcompleting_read (prompt, Vcoding_system_alist, Qnil,
19758
49a1662b68dd (Fread_coding_system): New optional arg DEFAULT_CODING_SYSTEM.
Richard M. Stallman <rms@gnu.org>
parents: 19750
diff changeset
8165 Qt, Qnil, Qcoding_system_history,
49a1662b68dd (Fread_coding_system): New optional arg DEFAULT_CODING_SYSTEM.
Richard M. Stallman <rms@gnu.org>
parents: 19750
diff changeset
8166 default_coding_system, Qnil);
79107
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
8167 unbind_to (count, Qnil);
46370
40db0673e6f0 Most uses of XSTRING combined with STRING_BYTES or indirection changed to
Ken Raeburn <raeburn@raeburn.org>
parents: 46293
diff changeset
8168 return (SCHARS (val) == 0 ? Qnil : Fintern (val, Qnil));
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8169 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8170
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8171 DEFUN ("check-coding-system", Fcheck_coding_system, Scheck_coding_system,
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8172 1, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8173 doc: /* Check validity of CODING-SYSTEM.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8174 If valid, return CODING-SYSTEM, else signal a `coding-system-error' error.
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
8175 It is valid if it is nil or a symbol defined as a coding system by the
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
8176 function `define-coding-system'. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
8177 (Lisp_Object coding_system)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8178 {
52794
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
8179 Lisp_Object define_form;
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
8180
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
8181 define_form = Fget (coding_system, Qcoding_system_define_form);
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
8182 if (! NILP (define_form))
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
8183 {
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
8184 Fput (coding_system, Qcoding_system_define_form, Qnil);
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
8185 safe_eval (define_form);
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
8186 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8187 if (!NILP (Fcoding_system_p (coding_system)))
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8188 return coding_system;
71972
eaa3c19b94d2 (Fcheck_coding_system): Use xsignal1. Remove loop.
Kim F. Storm <storm@cua.dk>
parents: 71084
diff changeset
8189 xsignal1 (Qcoding_system_error, coding_system);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8190 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8191
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8192
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8193 /* Detect how the bytes at SRC of length SRC_BYTES are encoded. If
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8194 HIGHEST is nonzero, return the coding system of the highest
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
8195 priority among the detected coding systems. Otherwise return a
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8196 list of detected coding systems sorted by their priorities. If
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8197 MULTIBYTEP is nonzero, it is assumed that the bytes are in correct
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8198 multibyte form but contain only ASCII and eight-bit chars.
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8199 Otherwise, the bytes are raw bytes.
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8200
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8201 CODING-SYSTEM controls the detection as below:
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8202
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8203 If it is nil, detect both text-format and eol-format. If the
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8204 text-format part of CODING-SYSTEM is already specified
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8205 (e.g. `iso-latin-1'), detect only eol-format. If the eol-format
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8206 part of CODING-SYSTEM is already specified (e.g. `undecided-unix'),
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8207 detect only text-format. */
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8208
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8209 Lisp_Object
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
8210 detect_coding_system (const unsigned char *src,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
8211 EMACS_INT src_chars, EMACS_INT src_bytes,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
8212 int highest, int multibytep,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
8213 Lisp_Object coding_system)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8214 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8215 const unsigned char *src_end = src + src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8216 Lisp_Object attrs, eol_type;
100135
0e17542db552 (detect_coding_system): Initialize utf_16_le_eol to -1, val to
Kenichi Handa <handa@m17n.org>
parents: 100133
diff changeset
8217 Lisp_Object val = Qnil;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8218 struct coding_system coding;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8219 int id;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8220 struct coding_detection_info detect_info;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8221 enum coding_category base_category;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8222 int null_byte_found = 0, eight_bit_found = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8223
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8224 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8225 coding_system = Qundecided;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8226 setup_coding_system (coding_system, &coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8227 attrs = CODING_ID_ATTRS (coding.id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8228 eol_type = CODING_ID_EOL_TYPE (coding.id);
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8229 coding_system = CODING_ATTR_BASE_NAME (attrs);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8230
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8231 coding.source = src;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8232 coding.src_chars = src_chars;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8233 coding.src_bytes = src_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8234 coding.src_multibyte = multibytep;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8235 coding.consumed = 0;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8236 coding.mode |= CODING_MODE_LAST_BLOCK;
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8237 coding.head_ascii = 0;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8238
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8239 detect_info.checked = detect_info.found = detect_info.rejected = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8240
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8241 /* At first, detect text-format if necessary. */
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8242 base_category = XINT (CODING_ATTR_CATEGORY (attrs));
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8243 if (base_category == coding_category_undecided)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8244 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8245 enum coding_category category;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8246 struct coding_system *this;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8247 int c, i;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8248
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8249 /* Skip all ASCII bytes except for a few ISO2022 controls. */
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8250 for (; src < src_end; src++)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8251 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8252 c = *src;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8253 if (c & 0x80)
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8254 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8255 eight_bit_found = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8256 if (null_byte_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8257 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8258 }
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8259 else if (c < 0x20)
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8260 {
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8261 if ((c == ISO_CODE_ESC || c == ISO_CODE_SI || c == ISO_CODE_SO)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8262 && ! inhibit_iso_escape_detection
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8263 && ! detect_info.checked)
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8264 {
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8265 if (detect_coding_iso_2022 (&coding, &detect_info))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8266 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8267 /* We have scanned the whole data. */
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8268 if (! (detect_info.rejected & CATEGORY_MASK_ISO_7_ELSE))
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8269 {
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8270 /* We didn't find an 8-bit code. We may
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8271 have found a null-byte, but it's very
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8272 rare that a binary file conforms to
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8273 ISO-2022. */
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8274 src = src_end;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8275 coding.head_ascii = src - coding.source;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8276 }
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8277 detect_info.rejected |= ~CATEGORY_MASK_ISO_ESCAPE;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8278 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8279 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8280 }
101040
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
8281 else if (! c && !inhibit_null_byte_detection)
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8282 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8283 null_byte_found = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8284 if (eight_bit_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8285 break;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8286 }
95585
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
8287 if (! eight_bit_found)
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
8288 coding.head_ascii++;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8289 }
95585
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
8290 else if (! eight_bit_found)
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8291 coding.head_ascii++;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8292 }
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8293
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8294 if (null_byte_found || eight_bit_found
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8295 || coding.head_ascii < coding.src_bytes
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8296 || detect_info.found)
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8297 {
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8298 if (coding.head_ascii == coding.src_bytes)
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8299 /* As all bytes are 7-bit, we can ignore non-ISO-2022 codings. */
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8300 for (i = 0; i < coding_category_raw_text; i++)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8301 {
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8302 category = coding_priorities[i];
90594
a965377e6761 (detect_coding_system): Fix for handling off
Kenichi Handa <handa@m17n.org>
parents: 90587
diff changeset
8303 this = coding_categories + category;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8304 if (detect_info.found & (1 << category))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8305 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8306 }
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8307 else
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8308 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8309 if (null_byte_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8310 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8311 detect_info.checked |= ~CATEGORY_MASK_UTF_16;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8312 detect_info.rejected |= ~CATEGORY_MASK_UTF_16;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8313 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8314 for (i = 0; i < coding_category_raw_text; i++)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8315 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8316 category = coding_priorities[i];
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8317 this = coding_categories + category;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8318
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8319 if (this->id < 0)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8320 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8321 /* No coding system of this category is defined. */
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8322 detect_info.rejected |= (1 << category);
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8323 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8324 else if (category >= coding_category_raw_text)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8325 continue;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8326 else if (detect_info.checked & (1 << category))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8327 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8328 if (highest
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8329 && (detect_info.found & (1 << category)))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8330 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8331 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8332 else if ((*(this->detector)) (&coding, &detect_info)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8333 && highest
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8334 && (detect_info.found & (1 << category)))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8335 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8336 if (category == coding_category_utf_16_auto)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8337 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8338 if (detect_info.found & CATEGORY_MASK_UTF_16_LE)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8339 category = coding_category_utf_16_le;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8340 else
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8341 category = coding_category_utf_16_be;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8342 }
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8343 break;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8344 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8345 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8346 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8347 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8348
101197
ee5f395f3c19 (detect_coding_system): Fix handling of null_byte_fount.
Kenichi Handa <handa@m17n.org>
parents: 101174
diff changeset
8349 if ((detect_info.rejected & CATEGORY_MASK_ANY) == CATEGORY_MASK_ANY
ee5f395f3c19 (detect_coding_system): Fix handling of null_byte_fount.
Kenichi Handa <handa@m17n.org>
parents: 101174
diff changeset
8350 || null_byte_found)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8351 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8352 detect_info.found = CATEGORY_MASK_RAW_TEXT;
101197
ee5f395f3c19 (detect_coding_system): Fix handling of null_byte_fount.
Kenichi Handa <handa@m17n.org>
parents: 101174
diff changeset
8353 id = CODING_SYSTEM_ID (Qno_conversion);
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8354 val = Fcons (make_number (id), Qnil);
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8355 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8356 else if (! detect_info.rejected && ! detect_info.found)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8357 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8358 detect_info.found = CATEGORY_MASK_ANY;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8359 id = coding_categories[coding_category_undecided].id;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8360 val = Fcons (make_number (id), Qnil);
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8361 }
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8362 else if (highest)
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8363 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8364 if (detect_info.found)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8365 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8366 detect_info.found = 1 << category;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8367 val = Fcons (make_number (this->id), Qnil);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8368 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8369 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8370 for (i = 0; i < coding_category_raw_text; i++)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8371 if (! (detect_info.rejected & (1 << coding_priorities[i])))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8372 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8373 detect_info.found = 1 << coding_priorities[i];
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8374 id = coding_categories[coding_priorities[i]].id;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8375 val = Fcons (make_number (id), Qnil);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8376 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8377 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8378 }
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8379 else
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8380 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8381 int mask = detect_info.rejected | detect_info.found;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8382 int found = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8383
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8384 for (i = coding_category_raw_text - 1; i >= 0; i--)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8385 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8386 category = coding_priorities[i];
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8387 if (! (mask & (1 << category)))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8388 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8389 found |= 1 << category;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8390 id = coding_categories[category].id;
90594
a965377e6761 (detect_coding_system): Fix for handling off
Kenichi Handa <handa@m17n.org>
parents: 90587
diff changeset
8391 if (id >= 0)
a965377e6761 (detect_coding_system): Fix for handling off
Kenichi Handa <handa@m17n.org>
parents: 90587
diff changeset
8392 val = Fcons (make_number (id), val);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8393 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8394 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8395 for (i = coding_category_raw_text - 1; i >= 0; i--)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8396 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8397 category = coding_priorities[i];
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8398 if (detect_info.found & (1 << category))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8399 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8400 id = coding_categories[category].id;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8401 val = Fcons (make_number (id), val);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8402 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8403 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8404 detect_info.found |= found;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8405 }
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8406 }
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8407 else if (base_category == coding_category_utf_8_auto)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8408 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8409 if (detect_coding_utf_8 (&coding, &detect_info))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8410 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8411 struct coding_system *this;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8412
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8413 if (detect_info.found & CATEGORY_MASK_UTF_8_SIG)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8414 this = coding_categories + coding_category_utf_8_sig;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8415 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8416 this = coding_categories + coding_category_utf_8_nosig;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8417 val = Fcons (make_number (this->id), Qnil);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8418 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8419 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8420 else if (base_category == coding_category_utf_16_auto)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8421 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8422 if (detect_coding_utf_16 (&coding, &detect_info))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8423 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8424 struct coding_system *this;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8425
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8426 if (detect_info.found & CATEGORY_MASK_UTF_16_LE)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8427 this = coding_categories + coding_category_utf_16_le;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8428 else if (detect_info.found & CATEGORY_MASK_UTF_16_BE)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8429 this = coding_categories + coding_category_utf_16_be;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8430 else if (detect_info.rejected & CATEGORY_MASK_UTF_16_LE_NOSIG)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8431 this = coding_categories + coding_category_utf_16_be_nosig;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8432 else
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8433 this = coding_categories + coding_category_utf_16_le_nosig;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8434 val = Fcons (make_number (this->id), Qnil);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8435 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8436 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8437 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8438 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8439 detect_info.found = 1 << XINT (CODING_ATTR_CATEGORY (attrs));
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8440 val = Fcons (make_number (coding.id), Qnil);
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8441 }
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8442
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8443 /* Then, detect eol-format if necessary. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8444 {
100135
0e17542db552 (detect_coding_system): Initialize utf_16_le_eol to -1, val to
Kenichi Handa <handa@m17n.org>
parents: 100133
diff changeset
8445 int normal_eol = -1, utf_16_be_eol = -1, utf_16_le_eol = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8446 Lisp_Object tail;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8447
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8448 if (VECTORP (eol_type))
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8449 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8450 if (detect_info.found & ~CATEGORY_MASK_UTF_16)
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8451 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8452 if (null_byte_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8453 normal_eol = EOL_SEEN_LF;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8454 else
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8455 normal_eol = detect_eol (coding.source, src_bytes,
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8456 coding_category_raw_text);
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8457 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8458 if (detect_info.found & (CATEGORY_MASK_UTF_16_BE
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8459 | CATEGORY_MASK_UTF_16_BE_NOSIG))
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8460 utf_16_be_eol = detect_eol (coding.source, src_bytes,
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8461 coding_category_utf_16_be);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8462 if (detect_info.found & (CATEGORY_MASK_UTF_16_LE
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8463 | CATEGORY_MASK_UTF_16_LE_NOSIG))
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8464 utf_16_le_eol = detect_eol (coding.source, src_bytes,
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8465 coding_category_utf_16_le);
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8466 }
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8467 else
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8468 {
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8469 if (EQ (eol_type, Qunix))
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8470 normal_eol = utf_16_be_eol = utf_16_le_eol = EOL_SEEN_LF;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8471 else if (EQ (eol_type, Qdos))
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8472 normal_eol = utf_16_be_eol = utf_16_le_eol = EOL_SEEN_CRLF;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8473 else
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8474 normal_eol = utf_16_be_eol = utf_16_le_eol = EOL_SEEN_CR;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8475 }
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8476
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8477 for (tail = val; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8478 {
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8479 enum coding_category category;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8480 int this_eol;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8481
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8482 id = XINT (XCAR (tail));
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8483 attrs = CODING_ID_ATTRS (id);
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8484 category = XINT (CODING_ATTR_CATEGORY (attrs));
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8485 eol_type = CODING_ID_EOL_TYPE (id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8486 if (VECTORP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8487 {
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8488 if (category == coding_category_utf_16_be
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8489 || category == coding_category_utf_16_be_nosig)
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8490 this_eol = utf_16_be_eol;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8491 else if (category == coding_category_utf_16_le
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8492 || category == coding_category_utf_16_le_nosig)
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8493 this_eol = utf_16_le_eol;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8494 else
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8495 this_eol = normal_eol;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8496
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8497 if (this_eol == EOL_SEEN_LF)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8498 XSETCAR (tail, AREF (eol_type, 0));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8499 else if (this_eol == EOL_SEEN_CRLF)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8500 XSETCAR (tail, AREF (eol_type, 1));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8501 else if (this_eol == EOL_SEEN_CR)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8502 XSETCAR (tail, AREF (eol_type, 2));
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8503 else
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8504 XSETCAR (tail, CODING_ID_NAME (id));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8505 }
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8506 else
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8507 XSETCAR (tail, CODING_ID_NAME (id));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8508 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8509 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8510
100135
0e17542db552 (detect_coding_system): Initialize utf_16_le_eol to -1, val to
Kenichi Handa <handa@m17n.org>
parents: 100133
diff changeset
8511 return (highest ? (CONSP (val) ? XCAR (val) : Qnil) : val);
42104
d69c2368e549 (DECODE_COMPOSITION_END): Fixed a typo in the last
Sam Steingold <sds@gnu.org>
parents: 42103
diff changeset
8512 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8513
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8514
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8515 DEFUN ("detect-coding-region", Fdetect_coding_region, Sdetect_coding_region,
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8516 2, 3, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8517 doc: /* Detect coding system of the text in the region between START and END.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8518 Return a list of possible coding systems ordered by priority.
102737
f556415c326b (Fdetect_coding_region, Fcoding_system_priority_list): Improve the
Kenichi Handa <handa@m17n.org>
parents: 102422
diff changeset
8519 The coding systems to try and their priorities follows what
f556415c326b (Fdetect_coding_region, Fcoding_system_priority_list): Improve the
Kenichi Handa <handa@m17n.org>
parents: 102422
diff changeset
8520 the function `coding-system-priority-list' (which see) returns.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8521
72552
6493d4697ad2 (Fdetect_coding_region, Fdetect_coding_string): Fix
Kenichi Handa <handa@m17n.org>
parents: 72395
diff changeset
8522 If only ASCII characters are found (except for such ISO-2022 control
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8523 characters as ESC), it returns a list of single element `undecided'
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8524 or its subsidiary coding system according to a detected end-of-line
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8525 format.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8526
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8527 If optional argument HIGHEST is non-nil, return the coding system of
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8528 highest priority. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
8529 (Lisp_Object start, Lisp_Object end, Lisp_Object highest)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8530 {
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8531 int from, to;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8532 int from_byte, to_byte;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8533
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8534 CHECK_NUMBER_COERCE_MARKER (start);
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8535 CHECK_NUMBER_COERCE_MARKER (end);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8536
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8537 validate_region (&start, &end);
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8538 from = XINT (start), to = XINT (end);
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8539 from_byte = CHAR_TO_BYTE (from);
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8540 to_byte = CHAR_TO_BYTE (to);
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8541
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8542 if (from < GPT && to >= GPT)
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8543 move_gap_both (to, to_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8544
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8545 return detect_coding_system (BYTE_POS_ADDR (from_byte),
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8546 to - from, to_byte - from_byte,
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
8547 !NILP (highest),
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
8548 !NILP (current_buffer
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8549 ->enable_multibyte_characters),
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8550 Qnil);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8551 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8552
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8553 DEFUN ("detect-coding-string", Fdetect_coding_string, Sdetect_coding_string,
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8554 1, 2, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8555 doc: /* Detect coding system of the text in STRING.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8556 Return a list of possible coding systems ordered by priority.
102738
41e7ab490f69 (Fdetect_coding_string): Improve the docstrings.
Kenichi Handa <handa@m17n.org>
parents: 102737
diff changeset
8557 The coding systems to try and their priorities follows what
41e7ab490f69 (Fdetect_coding_string): Improve the docstrings.
Kenichi Handa <handa@m17n.org>
parents: 102737
diff changeset
8558 the function `coding-system-priority-list' (which see) returns.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8559
72552
6493d4697ad2 (Fdetect_coding_region, Fdetect_coding_string): Fix
Kenichi Handa <handa@m17n.org>
parents: 72395
diff changeset
8560 If only ASCII characters are found (except for such ISO-2022 control
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8561 characters as ESC), it returns a list of single element `undecided'
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8562 or its subsidiary coding system according to a detected end-of-line
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8563 format.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8564
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8565 If optional argument HIGHEST is non-nil, return the coding system of
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8566 highest priority. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
8567 (Lisp_Object string, Lisp_Object highest)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8568 {
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8569 CHECK_STRING (string);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8570
46370
40db0673e6f0 Most uses of XSTRING combined with STRING_BYTES or indirection changed to
Ken Raeburn <raeburn@raeburn.org>
parents: 46293
diff changeset
8571 return detect_coding_system (SDATA (string),
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8572 SCHARS (string), SBYTES (string),
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8573 !NILP (highest), STRING_MULTIBYTE (string),
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8574 Qnil);
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8575 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8576
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8577
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8578 static INLINE int
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
8579 char_encodable_p (int c, Lisp_Object attrs)
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8580 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8581 Lisp_Object tail;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8582 struct charset *charset;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8583 Lisp_Object translation_table;
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8584
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8585 translation_table = CODING_ATTR_TRANS_TBL (attrs);
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
8586 if (! NILP (translation_table))
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8587 c = translate_char (translation_table, c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8588 for (tail = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8589 CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8590 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8591 charset = CHARSET_FROM_ID (XINT (XCAR (tail)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8592 if (CHAR_CHARSET_P (c, charset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8593 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8594 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8595 return (! NILP (tail));
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8596 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8597
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8598
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8599 /* Return a list of coding systems that safely encode the text between
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8600 START and END. If EXCLUDE is non-nil, it is a list of coding
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8601 systems not to check. The returned list doesn't contain any such
88889
4548f224c603 (Ffind_coding_systems_region_internal): Detect an
Kenichi Handa <handa@m17n.org>
parents: 88876
diff changeset
8602 coding systems. In any case, if the text contains only ASCII or is
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8603 unibyte, return t. */
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8604
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8605 DEFUN ("find-coding-systems-region-internal",
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8606 Ffind_coding_systems_region_internal,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8607 Sfind_coding_systems_region_internal, 2, 3, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8608 doc: /* Internal use only. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
8609 (Lisp_Object start, Lisp_Object end, Lisp_Object exclude)
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8610 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8611 Lisp_Object coding_attrs_list, safe_codings;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8612 EMACS_INT start_byte, end_byte;
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
8613 const unsigned char *p, *pbeg, *pend;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8614 int c;
103486
091a55d2d6f7 (Ffind_coding_systems_region_internal): Cache checked characters.
YAMAMOTO Mitsuharu <mituharu@math.s.chiba-u.ac.jp>
parents: 103474
diff changeset
8615 Lisp_Object tail, elt, work_table;
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8616
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8617 if (STRINGP (start))
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8618 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8619 if (!STRING_MULTIBYTE (start)
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8620 || SCHARS (start) == SBYTES (start))
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8621 return Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8622 start_byte = 0;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8623 end_byte = SBYTES (start);
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8624 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8625 else
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8626 {
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8627 CHECK_NUMBER_COERCE_MARKER (start);
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8628 CHECK_NUMBER_COERCE_MARKER (end);
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8629 if (XINT (start) < BEG || XINT (end) > Z || XINT (start) > XINT (end))
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8630 args_out_of_range (start, end);
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8631 if (NILP (current_buffer->enable_multibyte_characters))
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8632 return Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8633 start_byte = CHAR_TO_BYTE (XINT (start));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8634 end_byte = CHAR_TO_BYTE (XINT (end));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8635 if (XINT (end) - XINT (start) == end_byte - start_byte)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8636 return Qt;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8637
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8638 if (XINT (start) < GPT && XINT (end) > GPT)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8639 {
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8640 if ((GPT - XINT (start)) < (XINT (end) - GPT))
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8641 move_gap_both (XINT (start), start_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8642 else
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8643 move_gap_both (XINT (end), end_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8644 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8645 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8646
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8647 coding_attrs_list = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8648 for (tail = Vcoding_system_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8649 if (NILP (exclude)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8650 || NILP (Fmemq (XCAR (tail), exclude)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8651 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8652 Lisp_Object attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8653
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8654 attrs = AREF (CODING_SYSTEM_SPEC (XCAR (tail)), 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8655 if (EQ (XCAR (tail), CODING_ATTR_BASE_NAME (attrs))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8656 && ! EQ (CODING_ATTR_TYPE (attrs), Qundecided))
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8657 {
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8658 ASET (attrs, coding_attr_trans_tbl,
89861
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
8659 get_translation_table (attrs, 1, NULL));
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8660 coding_attrs_list = Fcons (attrs, coding_attrs_list);
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8661 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8662 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8663
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8664 if (STRINGP (start))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8665 p = pbeg = SDATA (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8666 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8667 p = pbeg = BYTE_POS_ADDR (start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8668 pend = p + (end_byte - start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8669
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8670 while (p < pend && ASCII_BYTE_P (*p)) p++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8671 while (p < pend && ASCII_BYTE_P (*(pend - 1))) pend--;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8672
103486
091a55d2d6f7 (Ffind_coding_systems_region_internal): Cache checked characters.
YAMAMOTO Mitsuharu <mituharu@math.s.chiba-u.ac.jp>
parents: 103474
diff changeset
8673 work_table = Fmake_char_table (Qnil, Qnil);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8674 while (p < pend)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8675 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8676 if (ASCII_BYTE_P (*p))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8677 p++;
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8678 else
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8679 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8680 c = STRING_CHAR_ADVANCE (p);
103486
091a55d2d6f7 (Ffind_coding_systems_region_internal): Cache checked characters.
YAMAMOTO Mitsuharu <mituharu@math.s.chiba-u.ac.jp>
parents: 103474
diff changeset
8681 if (!NILP (char_table_ref (work_table, c)))
091a55d2d6f7 (Ffind_coding_systems_region_internal): Cache checked characters.
YAMAMOTO Mitsuharu <mituharu@math.s.chiba-u.ac.jp>
parents: 103474
diff changeset
8682 /* This character was already checked. Ignore it. */
091a55d2d6f7 (Ffind_coding_systems_region_internal): Cache checked characters.
YAMAMOTO Mitsuharu <mituharu@math.s.chiba-u.ac.jp>
parents: 103474
diff changeset
8683 continue;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8684
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8685 charset_map_loaded = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8686 for (tail = coding_attrs_list; CONSP (tail);)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8687 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8688 elt = XCAR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8689 if (NILP (elt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8690 tail = XCDR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8691 else if (char_encodable_p (c, elt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8692 tail = XCDR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8693 else if (CONSP (XCDR (tail)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8694 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8695 XSETCAR (tail, XCAR (XCDR (tail)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8696 XSETCDR (tail, XCDR (XCDR (tail)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8697 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8698 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8699 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8700 XSETCAR (tail, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8701 tail = XCDR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8702 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8703 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8704 if (charset_map_loaded)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8705 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8706 EMACS_INT p_offset = p - pbeg, pend_offset = pend - pbeg;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8707
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8708 if (STRINGP (start))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8709 pbeg = SDATA (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8710 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8711 pbeg = BYTE_POS_ADDR (start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8712 p = pbeg + p_offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8713 pend = pbeg + pend_offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8714 }
103486
091a55d2d6f7 (Ffind_coding_systems_region_internal): Cache checked characters.
YAMAMOTO Mitsuharu <mituharu@math.s.chiba-u.ac.jp>
parents: 103474
diff changeset
8715 char_table_set (work_table, c, Qt);
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8716 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8717 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8718
89905
37e044cc35f6 (Ffind_coding_systems_region_internal): Include raw-text and
Kenichi Handa <handa@m17n.org>
parents: 89892
diff changeset
8719 safe_codings = list2 (Qraw_text, Qno_conversion);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8720 for (tail = coding_attrs_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8721 if (! NILP (XCAR (tail)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8722 safe_codings = Fcons (CODING_ATTR_BASE_NAME (XCAR (tail)), safe_codings);
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
8723
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
8724 return safe_codings;
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
8725 }
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
8726
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
8727
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8728 DEFUN ("unencodable-char-position", Funencodable_char_position,
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8729 Sunencodable_char_position, 3, 5, 0,
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8730 doc: /*
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8731 Return position of first un-encodable character in a region.
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8732 START and END specify the region and CODING-SYSTEM specifies the
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8733 encoding to check. Return nil if CODING-SYSTEM does encode the region.
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8734
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8735 If optional 4th argument COUNT is non-nil, it specifies at most how
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8736 many un-encodable characters to search. In this case, the value is a
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8737 list of positions.
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8738
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8739 If optional 5th argument STRING is non-nil, it is a string to search
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8740 for un-encodable characters. In that case, START and END are indexes
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8741 to the string. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
8742 (Lisp_Object start, Lisp_Object end, Lisp_Object coding_system, Lisp_Object count, Lisp_Object string)
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8743 {
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8744 int n;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8745 struct coding_system coding;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8746 Lisp_Object attrs, charset_list, translation_table;
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8747 Lisp_Object positions;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8748 int from, to;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8749 const unsigned char *p, *stop, *pend;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8750 int ascii_compatible;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8751
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8752 setup_coding_system (Fcheck_coding_system (coding_system), &coding);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8753 attrs = CODING_ID_ATTRS (coding.id);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8754 if (EQ (CODING_ATTR_TYPE (attrs), Qraw_text))
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8755 return Qnil;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8756 ascii_compatible = ! NILP (CODING_ATTR_ASCII_COMPAT (attrs));
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8757 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
89861
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
8758 translation_table = get_translation_table (attrs, 1, NULL);
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8759
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8760 if (NILP (string))
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8761 {
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8762 validate_region (&start, &end);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8763 from = XINT (start);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8764 to = XINT (end);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8765 if (NILP (current_buffer->enable_multibyte_characters)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8766 || (ascii_compatible
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8767 && (to - from) == (CHAR_TO_BYTE (to) - (CHAR_TO_BYTE (from)))))
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8768 return Qnil;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8769 p = CHAR_POS_ADDR (from);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8770 pend = CHAR_POS_ADDR (to);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8771 if (from < GPT && to >= GPT)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8772 stop = GPT_ADDR;
48829
f6c59ca557c7 (Funencodable_char_position): Set pend correctly.
Kenichi Handa <handa@m17n.org>
parents: 48230
diff changeset
8773 else
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8774 stop = pend;
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8775 }
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8776 else
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8777 {
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8778 CHECK_STRING (string);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8779 CHECK_NATNUM (start);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8780 CHECK_NATNUM (end);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8781 from = XINT (start);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8782 to = XINT (end);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8783 if (from > to
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8784 || to > SCHARS (string))
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8785 args_out_of_range_3 (string, start, end);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8786 if (! STRING_MULTIBYTE (string))
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8787 return Qnil;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8788 p = SDATA (string) + string_char_to_byte (string, from);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8789 stop = pend = SDATA (string) + string_char_to_byte (string, to);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8790 if (ascii_compatible && (to - from) == (pend - p))
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8791 return Qnil;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8792 }
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8793
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8794 if (NILP (count))
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8795 n = 1;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8796 else
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8797 {
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8798 CHECK_NATNUM (count);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8799 n = XINT (count);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8800 }
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8801
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8802 positions = Qnil;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8803 while (1)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8804 {
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8805 int c;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8806
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8807 if (ascii_compatible)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8808 while (p < stop && ASCII_BYTE_P (*p))
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8809 p++, from++;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8810 if (p >= stop)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8811 {
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8812 if (p >= pend)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8813 break;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8814 stop = pend;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8815 p = GAP_END_ADDR;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8816 }
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8817
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8818 c = STRING_CHAR_ADVANCE (p);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8819 if (! (ASCII_CHAR_P (c) && ascii_compatible)
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8820 && ! char_charset (translate_char (translation_table, c),
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8821 charset_list, NULL))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8822 {
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8823 positions = Fcons (make_number (from), positions);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8824 n--;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8825 if (n == 0)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8826 break;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8827 }
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8828
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8829 from++;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8830 }
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8831
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8832 return (NILP (count) ? Fcar (positions) : Fnreverse (positions));
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8833 }
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8834
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8835
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8836 DEFUN ("check-coding-systems-region", Fcheck_coding_systems_region,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8837 Scheck_coding_systems_region, 3, 3, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8838 doc: /* Check if the region is encodable by coding systems.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8839
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8840 START and END are buffer positions specifying the region.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8841 CODING-SYSTEM-LIST is a list of coding systems to check.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8842
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8843 The value is an alist ((CODING-SYSTEM POS0 POS1 ...) ...), where
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8844 CODING-SYSTEM is a member of CODING-SYSTEM-LIST and can't encode the
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8845 whole region, POS0, POS1, ... are buffer positions where non-encodable
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8846 characters are found.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8847
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8848 If all coding systems in CODING-SYSTEM-LIST can encode the region, the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8849 value is nil.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8850
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8851 START may be a string. In that case, check if the string is
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8852 encodable, and the value contains indices to the string instead of
102055
4d3a5c88cb2b (Fcheck_coding_systems_region): Fix typo; Qt -> Qnil.
Kenichi Handa <handa@m17n.org>
parents: 101943
diff changeset
8853 buffer positions. END is ignored.
4d3a5c88cb2b (Fcheck_coding_systems_region): Fix typo; Qt -> Qnil.
Kenichi Handa <handa@m17n.org>
parents: 101943
diff changeset
8854
102058
4f60db600648 (Fcheck_coding_systems_region): Fix test for unibyte
Andreas Schwab <schwab@suse.de>
parents: 102055
diff changeset
8855 If the current buffer (or START if it is a string) is unibyte, the value
102055
4d3a5c88cb2b (Fcheck_coding_systems_region): Fix typo; Qt -> Qnil.
Kenichi Handa <handa@m17n.org>
parents: 101943
diff changeset
8856 is nil. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
8857 (Lisp_Object start, Lisp_Object end, Lisp_Object coding_system_list)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8858 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8859 Lisp_Object list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8860 EMACS_INT start_byte, end_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8861 int pos;
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
8862 const unsigned char *p, *pbeg, *pend;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8863 int c;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8864 Lisp_Object tail, elt, attrs;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8865
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8866 if (STRINGP (start))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8867 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8868 if (!STRING_MULTIBYTE (start)
102058
4f60db600648 (Fcheck_coding_systems_region): Fix test for unibyte
Andreas Schwab <schwab@suse.de>
parents: 102055
diff changeset
8869 || SCHARS (start) == SBYTES (start))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8870 return Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8871 start_byte = 0;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8872 end_byte = SBYTES (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8873 pos = 0;
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8874 }
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8875 else
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8876 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8877 CHECK_NUMBER_COERCE_MARKER (start);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8878 CHECK_NUMBER_COERCE_MARKER (end);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8879 if (XINT (start) < BEG || XINT (end) > Z || XINT (start) > XINT (end))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8880 args_out_of_range (start, end);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8881 if (NILP (current_buffer->enable_multibyte_characters))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8882 return Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8883 start_byte = CHAR_TO_BYTE (XINT (start));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8884 end_byte = CHAR_TO_BYTE (XINT (end));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8885 if (XINT (end) - XINT (start) == end_byte - start_byte)
102055
4d3a5c88cb2b (Fcheck_coding_systems_region): Fix typo; Qt -> Qnil.
Kenichi Handa <handa@m17n.org>
parents: 101943
diff changeset
8886 return Qnil;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8887
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8888 if (XINT (start) < GPT && XINT (end) > GPT)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8889 {
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8890 if ((GPT - XINT (start)) < (XINT (end) - GPT))
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8891 move_gap_both (XINT (start), start_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8892 else
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8893 move_gap_both (XINT (end), end_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8894 }
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8895 pos = XINT (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8896 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8897
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8898 list = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8899 for (tail = coding_system_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8900 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8901 elt = XCAR (tail);
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8902 attrs = AREF (CODING_SYSTEM_SPEC (elt), 0);
89861
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
8903 ASET (attrs, coding_attr_trans_tbl,
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
8904 get_translation_table (attrs, 1, NULL));
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8905 list = Fcons (Fcons (elt, Fcons (attrs, Qnil)), list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8906 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8907
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8908 if (STRINGP (start))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8909 p = pbeg = SDATA (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8910 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8911 p = pbeg = BYTE_POS_ADDR (start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8912 pend = p + (end_byte - start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8913
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8914 while (p < pend && ASCII_BYTE_P (*p)) p++, pos++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8915 while (p < pend && ASCII_BYTE_P (*(pend - 1))) pend--;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8916
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8917 while (p < pend)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8918 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8919 if (ASCII_BYTE_P (*p))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8920 p++;
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8921 else
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8922 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8923 c = STRING_CHAR_ADVANCE (p);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8924
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8925 charset_map_loaded = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8926 for (tail = list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8927 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8928 elt = XCDR (XCAR (tail));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8929 if (! char_encodable_p (c, XCAR (elt)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8930 XSETCDR (elt, Fcons (make_number (pos), XCDR (elt)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8931 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8932 if (charset_map_loaded)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8933 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8934 EMACS_INT p_offset = p - pbeg, pend_offset = pend - pbeg;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8935
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8936 if (STRINGP (start))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8937 pbeg = SDATA (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8938 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8939 pbeg = BYTE_POS_ADDR (start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8940 p = pbeg + p_offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8941 pend = pbeg + pend_offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8942 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8943 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8944 pos++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8945 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8946
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8947 tail = list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8948 list = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8949 for (; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8950 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8951 elt = XCAR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8952 if (CONSP (XCDR (XCDR (elt))))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8953 list = Fcons (Fcons (XCAR (elt), Fnreverse (XCDR (XCDR (elt)))),
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8954 list);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8955 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8956
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8957 return list;
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8958 }
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8959
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8960
20803
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
8961 Lisp_Object
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
8962 code_convert_region (Lisp_Object start, Lisp_Object end,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
8963 Lisp_Object coding_system, Lisp_Object dst_object,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
8964 int encodep, int norecord)
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8965 {
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8966 struct coding_system coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8967 EMACS_INT from, from_byte, to, to_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8968 Lisp_Object src_object;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8969
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8970 CHECK_NUMBER_COERCE_MARKER (start);
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8971 CHECK_NUMBER_COERCE_MARKER (end);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8972 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8973 coding_system = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8974 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8975 CHECK_CODING_SYSTEM (coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8976 src_object = Fcurrent_buffer ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8977 if (NILP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8978 dst_object = src_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8979 else if (! EQ (dst_object, Qt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8980 CHECK_BUFFER (dst_object);
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8981
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8982 validate_region (&start, &end);
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8983 from = XFASTINT (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8984 from_byte = CHAR_TO_BYTE (from);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8985 to = XFASTINT (end);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8986 to_byte = CHAR_TO_BYTE (to);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8987
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8988 setup_coding_system (coding_system, &coding);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8989 coding.mode |= CODING_MODE_LAST_BLOCK;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8990
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8991 if (encodep)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8992 encode_coding_object (&coding, src_object, from, from_byte, to, to_byte,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8993 dst_object);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8994 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8995 decode_coding_object (&coding, src_object, from, from_byte, to, to_byte,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8996 dst_object);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8997 if (! norecord)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8998 Vlast_coding_system_used = CODING_ID_NAME (coding.id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8999
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9000 return (BUFFERP (dst_object)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9001 ? make_number (coding.produced_char)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9002 : coding.dst_object);
20803
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9003 }
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9004
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9005
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9006 DEFUN ("decode-coding-region", Fdecode_coding_region, Sdecode_coding_region,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9007 3, 4, "r\nzCoding system: ",
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9008 doc: /* Decode the current region from the specified coding system.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9009 When called from a program, takes four arguments:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9010 START, END, CODING-SYSTEM, and DESTINATION.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9011 START and END are buffer positions.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9012
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9013 Optional 4th arguments DESTINATION specifies where the decoded text goes.
91083
ff87badce376 (Fdecode_coding_region): Fix typo in docstring.
Kenichi Handa <handa@m17n.org>
parents: 91056
diff changeset
9014 If nil, the region between START and END is replaced by the decoded text.
98992
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
9015 If buffer, the decoded text is inserted in that buffer after point (point
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
9016 does not move).
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
9017 In those cases, the length of the decoded text is returned.
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
9018 If DESTINATION is t, the decoded text is returned.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9019
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9020 This function sets `last-coding-system-used' to the precise coding system
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9021 used (which may be different from CODING-SYSTEM if CODING-SYSTEM is
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
9022 not fully specified.) */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9023 (Lisp_Object start, Lisp_Object end, Lisp_Object coding_system, Lisp_Object destination)
20803
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9024 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9025 return code_convert_region (start, end, coding_system, destination, 0, 0);
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
9026 }
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
9027
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
9028 DEFUN ("encode-coding-region", Fencode_coding_region, Sencode_coding_region,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9029 3, 4, "r\nzCoding system: ",
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9030 doc: /* Encode the current region by specified coding system.
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9031 When called from a program, takes four arguments:
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9032 START, END, CODING-SYSTEM and DESTINATION.
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9033 START and END are buffer positions.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9034
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9035 Optional 4th arguments DESTINATION specifies where the encoded text goes.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9036 If nil, the region between START and END is replace by the encoded text.
98992
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
9037 If buffer, the encoded text is inserted in that buffer after point (point
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
9038 does not move).
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
9039 In those cases, the length of the encoded text is returned.
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
9040 If DESTINATION is t, the encoded text is returned.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9041
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9042 This function sets `last-coding-system-used' to the precise coding system
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9043 used (which may be different from CODING-SYSTEM if CODING-SYSTEM is
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
9044 not fully specified.) */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9045 (Lisp_Object start, Lisp_Object end, Lisp_Object coding_system, Lisp_Object destination)
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
9046 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9047 return code_convert_region (start, end, coding_system, destination, 1, 0);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9048 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9049
20803
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9050 Lisp_Object
109360
f37b85834f7e Convert more function definitions to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109179
diff changeset
9051 code_convert_string (Lisp_Object string, Lisp_Object coding_system,
f37b85834f7e Convert more function definitions to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109179
diff changeset
9052 Lisp_Object dst_object, int encodep, int nocopy, int norecord)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9053 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9054 struct coding_system coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9055 EMACS_INT chars, bytes;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9056
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
9057 CHECK_STRING (string);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9058 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9059 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9060 if (! norecord)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9061 Vlast_coding_system_used = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9062 if (NILP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9063 return (nocopy ? Fcopy_sequence (string) : string);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9064 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9065
70520
b6740a317343 (setup_coding_system): For invalid coding-system, set
Kenichi Handa <handa@m17n.org>
parents: 69995
diff changeset
9066 if (NILP (coding_system))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9067 coding_system = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9068 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9069 CHECK_CODING_SYSTEM (coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9070 if (NILP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9071 dst_object = Qt;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9072 else if (! EQ (dst_object, Qt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9073 CHECK_BUFFER (dst_object);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9074
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9075 setup_coding_system (coding_system, &coding);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9076 coding.mode |= CODING_MODE_LAST_BLOCK;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9077 chars = SCHARS (string);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9078 bytes = SBYTES (string);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9079 if (encodep)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9080 encode_coding_object (&coding, string, 0, 0, chars, bytes, dst_object);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9081 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9082 decode_coding_object (&coding, string, 0, 0, chars, bytes, dst_object);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9083 if (! norecord)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9084 Vlast_coding_system_used = CODING_ID_NAME (coding.id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9085
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9086 return (BUFFERP (dst_object)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9087 ? make_number (coding.produced_char)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9088 : coding.dst_object);
20803
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9089 }
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9090
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9091
22341
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
9092 /* Encode or decode STRING according to CODING_SYSTEM.
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
9093 Do not set Vlast_coding_system_used.
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
9094
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
9095 This function is called only from macros DECODE_FILE and
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
9096 ENCODE_FILE, thus we ignore character composition. */
22341
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
9097
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
9098 Lisp_Object
109159
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
9099 code_convert_string_norecord (Lisp_Object string, Lisp_Object coding_system,
3e9fdeb960d1 * coding.c, sysdep.c: Convert some more functions to standard C.
Juanma Barranquero <lekktu@gmail.com>
parents: 109158
diff changeset
9100 int encodep)
22341
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
9101 {
88430
6418a272b97e * coding.c: Delete unused variables.
Kenichi Handa <handa@m17n.org>
parents: 88365
diff changeset
9102 return code_convert_string (string, coding_system, Qt, encodep, 0, 1);
22341
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
9103 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9104
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9105
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9106 DEFUN ("decode-coding-string", Fdecode_coding_string, Sdecode_coding_string,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9107 2, 4, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9108 doc: /* Decode STRING which is encoded in CODING-SYSTEM, and return the result.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9109
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9110 Optional third arg NOCOPY non-nil means it is OK to return STRING itself
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9111 if the decoding operation is trivial.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9112
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9113 Optional fourth arg BUFFER non-nil means that the decoded text is
98992
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
9114 inserted in that buffer after point (point does not move). In this
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
9115 case, the return value is the length of the decoded text.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9116
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9117 This function sets `last-coding-system-used' to the precise coding system
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9118 used (which may be different from CODING-SYSTEM if CODING-SYSTEM is
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9119 not fully specified.) */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9120 (Lisp_Object string, Lisp_Object coding_system, Lisp_Object nocopy, Lisp_Object buffer)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9121 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9122 return code_convert_string (string, coding_system, buffer,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9123 0, ! NILP (nocopy), 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9124 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9125
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9126 DEFUN ("encode-coding-string", Fencode_coding_string, Sencode_coding_string,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9127 2, 4, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9128 doc: /* Encode STRING to CODING-SYSTEM, and return the result.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9129
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9130 Optional third arg NOCOPY non-nil means it is OK to return STRING
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9131 itself if the encoding operation is trivial.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9132
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9133 Optional fourth arg BUFFER non-nil means that the encoded text is
98992
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
9134 inserted in that buffer after point (point does not move). In this
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
9135 case, the return value is the length of the encoded text.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9136
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9137 This function sets `last-coding-system-used' to the precise coding system
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9138 used (which may be different from CODING-SYSTEM if CODING-SYSTEM is
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9139 not fully specified.) */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9140 (Lisp_Object string, Lisp_Object coding_system, Lisp_Object nocopy, Lisp_Object buffer)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9141 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9142 return code_convert_string (string, coding_system, buffer,
88856
13a375bc220d (ENCODE_DESIGNATION, decode_eol)
Dave Love <fx@gnu.org>
parents: 88845
diff changeset
9143 1, ! NILP (nocopy), 1);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9144 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9145
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
9146
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9147 DEFUN ("decode-sjis-char", Fdecode_sjis_char, Sdecode_sjis_char, 1, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9148 doc: /* Decode a Japanese character which has CODE in shift_jis encoding.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9149 Return the corresponding character. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9150 (Lisp_Object code)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9151 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9152 Lisp_Object spec, attrs, val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9153 struct charset *charset_roman, *charset_kanji, *charset_kana, *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9154 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9155
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9156 CHECK_NATNUM (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9157 c = XFASTINT (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9158 CHECK_CODING_SYSTEM_GET_SPEC (Vsjis_coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9159 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9160
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9161 if (ASCII_BYTE_P (c)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9162 && ! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9163 return code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9164
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9165 val = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9166 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
88497
d2b9e0d4c2f6 (Fdecode_sjis_char): Fix typo (0x7F->0xFF). Fix the
Kenichi Handa <handa@m17n.org>
parents: 88485
diff changeset
9167 charset_kana = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
d2b9e0d4c2f6 (Fdecode_sjis_char): Fix typo (0x7F->0xFF). Fix the
Kenichi Handa <handa@m17n.org>
parents: 88485
diff changeset
9168 charset_kanji = CHARSET_FROM_ID (XINT (XCAR (val)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9169
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9170 if (c <= 0x7F)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9171 charset = charset_roman;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9172 else if (c >= 0xA0 && c < 0xDF)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9173 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9174 charset = charset_kana;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9175 c -= 0x80;
24065
7e291dea6141 (Fdecode_sjis_char): Decode Japanese Katakana character
Kenichi Handa <handa@m17n.org>
parents: 24056
diff changeset
9176 }
7e291dea6141 (Fdecode_sjis_char): Decode Japanese Katakana character
Kenichi Handa <handa@m17n.org>
parents: 24056
diff changeset
9177 else
7e291dea6141 (Fdecode_sjis_char): Decode Japanese Katakana character
Kenichi Handa <handa@m17n.org>
parents: 24056
diff changeset
9178 {
88497
d2b9e0d4c2f6 (Fdecode_sjis_char): Fix typo (0x7F->0xFF). Fix the
Kenichi Handa <handa@m17n.org>
parents: 88485
diff changeset
9179 int s1 = c >> 8, s2 = c & 0xFF;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9180
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9181 if (s1 < 0x81 || (s1 > 0x9F && s1 < 0xE0) || s1 > 0xEF
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9182 || s2 < 0x40 || s2 == 0x7F || s2 > 0xFC)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9183 error ("Invalid code: %d", code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9184 SJIS_TO_JIS (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9185 charset = charset_kanji;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9186 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9187 c = DECODE_CHAR (charset, c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9188 if (c < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9189 error ("Invalid code: %d", code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9190 return make_number (c);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9191 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9192
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9193
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9194 DEFUN ("encode-sjis-char", Fencode_sjis_char, Sencode_sjis_char, 1, 1, 0,
73949
0d1207b43a5b (Fencode_sjis_char, Fencode_big5_char): Improve argument/docstring consistency.
Juanma Barranquero <lekktu@gmail.com>
parents: 72552
diff changeset
9195 doc: /* Encode a Japanese character CH to shift_jis encoding.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9196 Return the corresponding code in SJIS. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9197 (Lisp_Object ch)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9198 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9199 Lisp_Object spec, attrs, charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9200 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9201 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9202 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9203
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9204 CHECK_CHARACTER (ch);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9205 c = XFASTINT (ch);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9206 CHECK_CODING_SYSTEM_GET_SPEC (Vsjis_coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9207 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9208
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9209 if (ASCII_CHAR_P (c)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9210 && ! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9211 return ch;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9212
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9213 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9214 charset = char_charset (c, charset_list, &code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9215 if (code == CHARSET_INVALID_CODE (charset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9216 error ("Can't encode by shift_jis encoding: %d", c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9217 JIS_TO_SJIS (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9218
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9219 return make_number (code);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9220 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9221
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9222 DEFUN ("decode-big5-char", Fdecode_big5_char, Sdecode_big5_char, 1, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9223 doc: /* Decode a Big5 character which has CODE in BIG5 coding system.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9224 Return the corresponding character. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9225 (Lisp_Object code)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9226 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9227 Lisp_Object spec, attrs, val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9228 struct charset *charset_roman, *charset_big5, *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9229 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9230
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9231 CHECK_NATNUM (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9232 c = XFASTINT (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9233 CHECK_CODING_SYSTEM_GET_SPEC (Vbig5_coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9234 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9235
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9236 if (ASCII_BYTE_P (c)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9237 && ! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9238 return code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9239
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9240 val = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9241 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9242 charset_big5 = CHARSET_FROM_ID (XINT (XCAR (val)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9243
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9244 if (c <= 0x7F)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9245 charset = charset_roman;
24324
2eec590faf26 (Fdecode_sjis_char, Fencode_sjis_char): Hanlde
Kenichi Handa <handa@m17n.org>
parents: 24316
diff changeset
9246 else
2eec590faf26 (Fdecode_sjis_char, Fencode_sjis_char): Hanlde
Kenichi Handa <handa@m17n.org>
parents: 24316
diff changeset
9247 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9248 int b1 = c >> 8, b2 = c & 0x7F;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9249 if (b1 < 0xA1 || b1 > 0xFE
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9250 || b2 < 0x40 || (b2 > 0x7E && b2 < 0xA1) || b2 > 0xFE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9251 error ("Invalid code: %d", code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9252 charset = charset_big5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9253 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9254 c = DECODE_CHAR (charset, (unsigned )c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9255 if (c < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9256 error ("Invalid code: %d", code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9257 return make_number (c);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9258 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9259
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9260 DEFUN ("encode-big5-char", Fencode_big5_char, Sencode_big5_char, 1, 1, 0,
73949
0d1207b43a5b (Fencode_sjis_char, Fencode_big5_char): Improve argument/docstring consistency.
Juanma Barranquero <lekktu@gmail.com>
parents: 72552
diff changeset
9261 doc: /* Encode the Big5 character CH to BIG5 coding system.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9262 Return the corresponding character code in Big5. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9263 (Lisp_Object ch)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9264 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9265 Lisp_Object spec, attrs, charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9266 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9267 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9268 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9269
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9270 CHECK_CHARACTER (ch);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9271 c = XFASTINT (ch);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9272 CHECK_CODING_SYSTEM_GET_SPEC (Vbig5_coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9273 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9274 if (ASCII_CHAR_P (c)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9275 && ! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9276 return ch;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9277
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9278 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9279 charset = char_charset (c, charset_list, &code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9280 if (code == CHARSET_INVALID_CODE (charset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9281 error ("Can't encode by Big5 encoding: %d", c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9282
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9283 return make_number (code);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9284 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9285
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
9286
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
9287 DEFUN ("set-terminal-coding-system-internal", Fset_terminal_coding_system_internal,
83298
ed09a89e2b25 Fix UTF-8 tty input when first frame is an X frame. Steps towards multiple tty locale support.
Karoly Lorentey <lorentey@elte.hu>
parents: 83292
diff changeset
9288 Sset_terminal_coding_system_internal, 1, 2, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9289 doc: /* Internal use only. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9290 (Lisp_Object coding_system, Lisp_Object terminal)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9291 {
111237
6788b08ca420 Handle glyphless characters on tty.
Kenichi Handa <handa@m17n.org>
parents: 110997
diff changeset
9292 struct terminal *term = get_terminal (terminal, 1);
6788b08ca420 Handle glyphless characters on tty.
Kenichi Handa <handa@m17n.org>
parents: 110997
diff changeset
9293 struct coding_system *terminal_coding = TERMINAL_TERMINAL_CODING (term);
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
9294 CHECK_SYMBOL (coding_system);
83127
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
9295 setup_coding_system (Fcheck_coding_system (coding_system), terminal_coding);
20150
402b6e5f4b58 (encode_designation_at_bol): Fix bug of finding graphic
Kenichi Handa <handa@m17n.org>
parents: 20105
diff changeset
9296 /* We had better not send unsafe characters to terminal. */
91041
bdb3fe0ba9fa Merge from emacs--devo--0
Miles Bader <miles@gnu.org>
parents: 90996 84646
diff changeset
9297 terminal_coding->mode |= CODING_MODE_SAFE_ENCODING;
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
9298 /* Character composition should be disabled. */
91041
bdb3fe0ba9fa Merge from emacs--devo--0
Miles Bader <miles@gnu.org>
parents: 90996 84646
diff changeset
9299 terminal_coding->common_flags &= ~CODING_ANNOTATE_COMPOSITION_MASK;
83127
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
9300 terminal_coding->src_multibyte = 1;
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
9301 terminal_coding->dst_multibyte = 0;
111237
6788b08ca420 Handle glyphless characters on tty.
Kenichi Handa <handa@m17n.org>
parents: 110997
diff changeset
9302 if (terminal_coding->common_flags & CODING_REQUIRE_ENCODING_MASK)
6788b08ca420 Handle glyphless characters on tty.
Kenichi Handa <handa@m17n.org>
parents: 110997
diff changeset
9303 term->charset_list = coding_charset_list (terminal_coding);
6788b08ca420 Handle glyphless characters on tty.
Kenichi Handa <handa@m17n.org>
parents: 110997
diff changeset
9304 else
111575
c1042b16fa46 coding.c (Fset_terminal_coding_system_internal): Fix previous change (set charset-ID list instead of charset-symbol list).
Kenichi Handa <handa@m17n.org>
parents: 111402
diff changeset
9305 term->charset_list = Fcons (make_number (charset_ascii), Qnil);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9306 return Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9307 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9308
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9309 DEFUN ("set-safe-terminal-coding-system-internal",
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9310 Fset_safe_terminal_coding_system_internal,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9311 Sset_safe_terminal_coding_system_internal, 1, 1, 0,
41006
fd83ec62a495 Doc fix.
Pavel Janík <Pavel@Janik.cz>
parents: 40842
diff changeset
9312 doc: /* Internal use only. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9313 (Lisp_Object coding_system)
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9314 {
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
9315 CHECK_SYMBOL (coding_system);
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9316 setup_coding_system (Fcheck_coding_system (coding_system),
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9317 &safe_terminal_coding);
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
9318 /* Character composition should be disabled. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9319 safe_terminal_coding.common_flags &= ~CODING_ANNOTATE_COMPOSITION_MASK;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
9320 safe_terminal_coding.src_multibyte = 1;
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
9321 safe_terminal_coding.dst_multibyte = 0;
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9322 return Qnil;
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9323 }
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9324
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
9325 DEFUN ("terminal-coding-system", Fterminal_coding_system,
83298
ed09a89e2b25 Fix UTF-8 tty input when first frame is an X frame. Steps towards multiple tty locale support.
Karoly Lorentey <lorentey@elte.hu>
parents: 83292
diff changeset
9326 Sterminal_coding_system, 0, 1, 0,
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
9327 doc: /* Return coding system specified for terminal output on the given terminal.
103052
e68707cf48a5 * keyboard.c (Fset_input_meta_mode): Doc fix.
Chong Yidong <cyd@stupidchicken.com>
parents: 103035
diff changeset
9328 TERMINAL may be a terminal object, a frame, or nil for the selected
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
9329 frame's terminal device. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9330 (Lisp_Object terminal)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9331 {
91046
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9332 struct coding_system *terminal_coding
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9333 = TERMINAL_TERMINAL_CODING (get_terminal (terminal, 1));
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9334 Lisp_Object coding_system = CODING_ID_NAME (terminal_coding->id);
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9335
90011
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
9336 /* For backward compatibility, return nil if it is `undecided'. */
90359
041f75914d0c (produce_composition): Compare charbuf[i] instead of
Kenichi Handa <handa@m17n.org>
parents: 90354
diff changeset
9337 return (! EQ (coding_system, Qundecided) ? coding_system : Qnil);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9338 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9339
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
9340 DEFUN ("set-keyboard-coding-system-internal", Fset_keyboard_coding_system_internal,
83298
ed09a89e2b25 Fix UTF-8 tty input when first frame is an X frame. Steps towards multiple tty locale support.
Karoly Lorentey <lorentey@elte.hu>
parents: 83292
diff changeset
9341 Sset_keyboard_coding_system_internal, 1, 2, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9342 doc: /* Internal use only. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9343 (Lisp_Object coding_system, Lisp_Object terminal)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9344 {
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
9345 struct terminal *t = get_terminal (terminal, 1);
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
9346 CHECK_SYMBOL (coding_system);
103655
e2d67c929da2 (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 103486
diff changeset
9347 if (NILP (coding_system))
e2d67c929da2 (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 103486
diff changeset
9348 coding_system = Qno_conversion;
e2d67c929da2 (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 103486
diff changeset
9349 else
e2d67c929da2 (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 103486
diff changeset
9350 Fcheck_coding_system (coding_system);
e2d67c929da2 (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 103486
diff changeset
9351 setup_coding_system (coding_system, TERMINAL_KEYBOARD_CODING (t));
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
9352 /* Character composition should be disabled. */
91041
bdb3fe0ba9fa Merge from emacs--devo--0
Miles Bader <miles@gnu.org>
parents: 90996 84646
diff changeset
9353 TERMINAL_KEYBOARD_CODING (t)->common_flags
bdb3fe0ba9fa Merge from emacs--devo--0
Miles Bader <miles@gnu.org>
parents: 90996 84646
diff changeset
9354 &= ~CODING_ANNOTATE_COMPOSITION_MASK;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9355 return Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9356 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9357
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9358 DEFUN ("keyboard-coding-system",
91046
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9359 Fkeyboard_coding_system, Skeyboard_coding_system, 0, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9360 doc: /* Return coding system specified for decoding keyboard input. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9361 (Lisp_Object terminal)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9362 {
91046
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9363 return CODING_ID_NAME (TERMINAL_KEYBOARD_CODING
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9364 (get_terminal (terminal, 1))->id);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9365 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9366
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9367
18536
69c0e220b626 (Vstandard_character_unification_table_for_decode):
Kenichi Handa <handa@m17n.org>
parents: 18523
diff changeset
9368 DEFUN ("find-operation-coding-system", Ffind_operation_coding_system,
69c0e220b626 (Vstandard_character_unification_table_for_decode):
Kenichi Handa <handa@m17n.org>
parents: 18523
diff changeset
9369 Sfind_operation_coding_system, 1, MANY, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9370 doc: /* Choose a coding system for an operation based on the target name.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9371 The value names a pair of coding systems: (DECODING-SYSTEM . ENCODING-SYSTEM).
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9372 DECODING-SYSTEM is the coding system to use for decoding
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9373 \(in case OPERATION does decoding), and ENCODING-SYSTEM is the coding system
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9374 for encoding (in case OPERATION does encoding).
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9375
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9376 The first argument OPERATION specifies an I/O primitive:
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9377 For file I/O, `insert-file-contents' or `write-region'.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9378 For process I/O, `call-process', `call-process-region', or `start-process'.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9379 For network I/O, `open-network-stream'.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9380
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9381 The remaining arguments should be the same arguments that were passed
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9382 to the primitive. Depending on which primitive, one of those arguments
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9383 is selected as the TARGET. For example, if OPERATION does file I/O,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9384 whichever argument specifies the file name is TARGET.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9385
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9386 TARGET has a meaning which depends on OPERATION:
70948
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
9387 For file I/O, TARGET is a file name (except for the special case below).
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9388 For process I/O, TARGET is a process name.
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9389 For network I/O, TARGET is a service name or a port number.
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9390
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9391 This function looks up what is specified for TARGET in
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9392 `file-coding-system-alist', `process-coding-system-alist',
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9393 or `network-coding-system-alist' depending on OPERATION.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9394 They may specify a coding system, a cons of coding systems,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9395 or a function symbol to call.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9396 In the last case, we call the function with one argument,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9397 which is a list of all the arguments given to this function.
81611
ae42ad5f89e6 (Ffind_operation_coding_system): Docstring improved.
Kenichi Handa <handa@m17n.org>
parents: 75348
diff changeset
9398 If the function can't decide a coding system, it can return
ae42ad5f89e6 (Ffind_operation_coding_system): Docstring improved.
Kenichi Handa <handa@m17n.org>
parents: 75348
diff changeset
9399 `undecided' so that the normal code-detection is performed.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9400
70948
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
9401 If OPERATION is `insert-file-contents', the argument corresponding to
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
9402 TARGET may be a cons (FILENAME . BUFFER). In that case, FILENAME is a
71084
ccef92f2f7f8 (Ffind_operation_coding_system): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents: 71070
diff changeset
9403 file name to look up, and BUFFER is a buffer that contains the file's
ccef92f2f7f8 (Ffind_operation_coding_system): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents: 71070
diff changeset
9404 contents (not yet decoded). If `file-coding-system-alist' specifies a
71070
0c8ac7192244 (Ffind_operation_coding_system): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents: 71039
diff changeset
9405 function to call for FILENAME, that function should examine the
0c8ac7192244 (Ffind_operation_coding_system): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents: 71039
diff changeset
9406 contents of BUFFER instead of reading the file.
70948
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
9407
78152
5e5f359984e5 (Ffind_operation_coding_system): Doc fix.
Juanma Barranquero <lekktu@gmail.com>
parents: 75348
diff changeset
9408 usage: (find-operation-coding-system OPERATION ARGUMENTS...) */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9409 (int nargs, Lisp_Object *args)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9410 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9411 Lisp_Object operation, target_idx, target, val;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9412 register Lisp_Object chain;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9413
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9414 if (nargs < 2)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9415 error ("Too few arguments");
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9416 operation = args[0];
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9417 if (!SYMBOLP (operation)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9418 || !INTEGERP (target_idx = Fget (operation, Qtarget_idx)))
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
9419 error ("Invalid first argument");
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9420 if (nargs < 1 + XINT (target_idx))
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9421 error ("Too few arguments for operation: %s",
46370
40db0673e6f0 Most uses of XSTRING combined with STRING_BYTES or indirection changed to
Ken Raeburn <raeburn@raeburn.org>
parents: 46293
diff changeset
9422 SDATA (SYMBOL_NAME (operation)));
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9423 target = args[XINT (target_idx) + 1];
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9424 if (!(STRINGP (target)
70948
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
9425 || (EQ (operation, Qinsert_file_contents) && CONSP (target)
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
9426 && STRINGP (XCAR (target)) && BUFFERP (XCDR (target)))
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9427 || (EQ (operation, Qopen_network_stream) && INTEGERP (target))))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9428 error ("Invalid %dth argument", XINT (target_idx) + 1);
70948
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
9429 if (CONSP (target))
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
9430 target = XCAR (target);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9431
18613
614b916ff5bf Fix bugs with inappropriate mixing of Lisp_Object with int.
Richard M. Stallman <rms@gnu.org>
parents: 18536
diff changeset
9432 chain = ((EQ (operation, Qinsert_file_contents)
614b916ff5bf Fix bugs with inappropriate mixing of Lisp_Object with int.
Richard M. Stallman <rms@gnu.org>
parents: 18536
diff changeset
9433 || EQ (operation, Qwrite_region))
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9434 ? Vfile_coding_system_alist
18613
614b916ff5bf Fix bugs with inappropriate mixing of Lisp_Object with int.
Richard M. Stallman <rms@gnu.org>
parents: 18536
diff changeset
9435 : (EQ (operation, Qopen_network_stream)
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9436 ? Vnetwork_coding_system_alist
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9437 : Vprocess_coding_system_alist));
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9438 if (NILP (chain))
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9439 return Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9440
25662
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
9441 for (; CONSP (chain); chain = XCDR (chain))
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9442 {
19747
bed06df9cbc5 (setup_coding_system, Ffind_operation_coding_system)
Richard M. Stallman <rms@gnu.org>
parents: 19743
diff changeset
9443 Lisp_Object elt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9444
25662
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
9445 elt = XCAR (chain);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9446 if (CONSP (elt)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9447 && ((STRINGP (target)
25662
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
9448 && STRINGP (XCAR (elt))
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
9449 && fast_string_match (XCAR (elt), target) >= 0)
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
9450 || (INTEGERP (target) && EQ (target, XCAR (elt)))))
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9451 {
25662
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
9452 val = XCDR (elt);
19763
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9453 /* Here, if VAL is both a valid coding system and a valid
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9454 function symbol, we return VAL as a coding system. */
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9455 if (CONSP (val))
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9456 return val;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9457 if (! SYMBOLP (val))
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9458 return Qnil;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9459 if (! NILP (Fcoding_system_p (val)))
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9460 return Fcons (val, val);
19763
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9461 if (! NILP (Ffboundp (val)))
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9462 {
72188
6100ca974994 Comment change.
Richard M. Stallman <rms@gnu.org>
parents: 72180
diff changeset
9463 /* We use call1 rather than safe_call1
6100ca974994 Comment change.
Richard M. Stallman <rms@gnu.org>
parents: 72180
diff changeset
9464 so as to get bug reports about functions called here
6100ca974994 Comment change.
Richard M. Stallman <rms@gnu.org>
parents: 72180
diff changeset
9465 which don't handle the current interface. */
72180
f3bc55b96df5 (Ffind_operation_coding_system): Revert the change from 2006-05-29.
Eli Zaretskii <eliz@gnu.org>
parents: 71972
diff changeset
9466 val = call1 (val, Flist (nargs, args));
19763
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9467 if (CONSP (val))
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9468 return val;
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9469 if (SYMBOLP (val) && ! NILP (Fcoding_system_p (val)))
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9470 return Fcons (val, val);
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9471 }
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9472 return Qnil;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9473 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9474 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9475 return Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9476 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9477
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9478 DEFUN ("set-coding-system-priority", Fset_coding_system_priority,
88845
64b8f6168269 (Fset_coding_system_priority): Allow null arg list.
Dave Love <fx@gnu.org>
parents: 88771
diff changeset
9479 Sset_coding_system_priority, 0, MANY, 0,
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
9480 doc: /* Assign higher priority to the coding systems given as arguments.
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9481 If multiple coding systems belong to the same category,
89519
040a08a2a879 (Fread_coding_system): Fix arg of XSETSTRING.
Dave Love <fx@gnu.org>
parents: 89483
diff changeset
9482 all but the first one are ignored.
040a08a2a879 (Fread_coding_system): Fix arg of XSETSTRING.
Dave Love <fx@gnu.org>
parents: 89483
diff changeset
9483
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9484 usage: (set-coding-system-priority &rest coding-systems) */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9485 (int nargs, Lisp_Object *args)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9486 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9487 int i, j;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9488 int changed[coding_category_max];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9489 enum coding_category priorities[coding_category_max];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9490
109165
750db9f3e6d8 Replace bcopy, bzero, bcmp by memcpy, memmove, memset, memcmp
Andreas Schwab <schwab@linux-m68k.org>
parents: 109159
diff changeset
9491 memset (changed, 0, sizeof changed);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9492
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9493 for (i = j = 0; i < nargs; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9494 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9495 enum coding_category category;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9496 Lisp_Object spec, attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9497
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9498 CHECK_CODING_SYSTEM_GET_SPEC (args[i], spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9499 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9500 category = XINT (CODING_ATTR_CATEGORY (attrs));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9501 if (changed[category])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9502 /* Ignore this coding system because a coding system of the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9503 same category already had a higher priority. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9504 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9505 changed[category] = 1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9506 priorities[j++] = category;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9507 if (coding_categories[category].id >= 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9508 && ! EQ (args[i], CODING_ID_NAME (coding_categories[category].id)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9509 setup_coding_system (args[i], &coding_categories[category]);
89467
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9510 Fset (AREF (Vcoding_category_table, category), args[i]);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9511 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9512
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9513 /* Now we have decided top J priorities. Reflect the order of the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9514 original priorities to the remaining priorities. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9515
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9516 for (i = j, j = 0; i < coding_category_max; i++, j++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9517 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9518 while (j < coding_category_max
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9519 && changed[coding_priorities[j]])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9520 j++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9521 if (j == coding_category_max)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9522 abort ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9523 priorities[i] = coding_priorities[j];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9524 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9525
109165
750db9f3e6d8 Replace bcopy, bzero, bcmp by memcpy, memmove, memset, memcmp
Andreas Schwab <schwab@linux-m68k.org>
parents: 109159
diff changeset
9526 memcpy (coding_priorities, priorities, sizeof priorities);
89467
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9527
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9528 /* Update `coding-category-list'. */
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9529 Vcoding_category_list = Qnil;
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9530 for (i = coding_category_max - 1; i >= 0; i--)
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9531 Vcoding_category_list
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9532 = Fcons (AREF (Vcoding_category_table, priorities[i]),
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9533 Vcoding_category_list);
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
9534
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9535 return Qnil;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9536 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9537
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9538 DEFUN ("coding-system-priority-list", Fcoding_system_priority_list,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9539 Scoding_system_priority_list, 0, 1, 0,
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
9540 doc: /* Return a list of coding systems ordered by their priorities.
102737
f556415c326b (Fdetect_coding_region, Fcoding_system_priority_list): Improve the
Kenichi Handa <handa@m17n.org>
parents: 102422
diff changeset
9541 The list contains a subset of coding systems; i.e. coding systems
f556415c326b (Fdetect_coding_region, Fcoding_system_priority_list): Improve the
Kenichi Handa <handa@m17n.org>
parents: 102422
diff changeset
9542 assigned to each coding category (see `coding-category-list').
f556415c326b (Fdetect_coding_region, Fcoding_system_priority_list): Improve the
Kenichi Handa <handa@m17n.org>
parents: 102422
diff changeset
9543
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
9544 HIGHESTP non-nil means just return the highest priority one. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9545 (Lisp_Object highestp)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9546 {
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9547 int i;
22954
928b337d953b Avoid using initializers for Lisp_Object.
Richard M. Stallman <rms@gnu.org>
parents: 22874
diff changeset
9548 Lisp_Object val;
928b337d953b Avoid using initializers for Lisp_Object.
Richard M. Stallman <rms@gnu.org>
parents: 22874
diff changeset
9549
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9550 for (i = 0, val = Qnil; i < coding_category_max; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9551 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9552 enum coding_category category = coding_priorities[i];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9553 int id = coding_categories[category].id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9554 Lisp_Object attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9555
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9556 if (id < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9557 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9558 attrs = CODING_ID_ATTRS (id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9559 if (! NILP (highestp))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9560 return CODING_ATTR_BASE_NAME (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9561 val = Fcons (CODING_ATTR_BASE_NAME (attrs), val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9562 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9563 return Fnreverse (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9564 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9565
105959
ba3ffbd9c422 * process.c (ifflag_def): Make flag_sym constant.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105877
diff changeset
9566 static const char *const suffixes[] = { "-unix", "-dos", "-mac" };
88631
780b91d4a7e5 (setup_iso_safe_charsets): Fix arg decl for K&R.
Dave Love <fx@gnu.org>
parents: 88607
diff changeset
9567
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9568 static Lisp_Object
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
9569 make_subsidiaries (Lisp_Object base)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9570 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9571 Lisp_Object subsidiaries;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9572 int base_name_len = SBYTES (SYMBOL_NAME (base));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9573 char *buf = (char *) alloca (base_name_len + 6);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9574 int i;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9575
109165
750db9f3e6d8 Replace bcopy, bzero, bcmp by memcpy, memmove, memset, memcmp
Andreas Schwab <schwab@linux-m68k.org>
parents: 109159
diff changeset
9576 memcpy (buf, SDATA (SYMBOL_NAME (base)), base_name_len);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9577 subsidiaries = Fmake_vector (make_number (3), Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9578 for (i = 0; i < 3; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9579 {
109165
750db9f3e6d8 Replace bcopy, bzero, bcmp by memcpy, memmove, memset, memcmp
Andreas Schwab <schwab@linux-m68k.org>
parents: 109159
diff changeset
9580 memcpy (buf + base_name_len, suffixes[i], strlen (suffixes[i]) + 1);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9581 ASET (subsidiaries, i, intern (buf));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9582 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9583 return subsidiaries;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9584 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9585
22226
557fac086b1b (ascii_skip_code): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22186
diff changeset
9586
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
9587 DEFUN ("define-coding-system-internal", Fdefine_coding_system_internal,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9588 Sdefine_coding_system_internal, coding_arg_max, MANY, 0,
88544
f464d728344c (Vchar_coding_system_table, Qchar_coding_system):
Dave Love <fx@gnu.org>
parents: 88510
diff changeset
9589 doc: /* For internal use only.
f464d728344c (Vchar_coding_system_table, Qchar_coding_system):
Dave Love <fx@gnu.org>
parents: 88510
diff changeset
9590 usage: (define-coding-system-internal ...) */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
9591 (int nargs, Lisp_Object *args)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9592 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9593 Lisp_Object name;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9594 Lisp_Object spec_vec; /* [ ATTRS ALIASE EOL_TYPE ] */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9595 Lisp_Object attrs; /* Vector of attributes. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9596 Lisp_Object eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9597 Lisp_Object aliases;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9598 Lisp_Object coding_type, charset_list, safe_charsets;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9599 enum coding_category category;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9600 Lisp_Object tail, val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9601 int max_charset_id = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9602 int i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9603
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9604 if (nargs < coding_arg_max)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9605 goto short_args;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9606
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9607 attrs = Fmake_vector (make_number (coding_attr_last_index), Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9608
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9609 name = args[coding_arg_name];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9610 CHECK_SYMBOL (name);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9611 CODING_ATTR_BASE_NAME (attrs) = name;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9612
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9613 val = args[coding_arg_mnemonic];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9614 if (! STRINGP (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9615 CHECK_CHARACTER (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9616 CODING_ATTR_MNEMONIC (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9617
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9618 coding_type = args[coding_arg_coding_type];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9619 CHECK_SYMBOL (coding_type);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9620 CODING_ATTR_TYPE (attrs) = coding_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9621
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9622 charset_list = args[coding_arg_charset_list];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9623 if (SYMBOLP (charset_list))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9624 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9625 if (EQ (charset_list, Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9626 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9627 if (! EQ (coding_type, Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9628 error ("Invalid charset-list");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9629 charset_list = Viso_2022_charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9630 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9631 else if (EQ (charset_list, Qemacs_mule))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9632 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9633 if (! EQ (coding_type, Qemacs_mule))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9634 error ("Invalid charset-list");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9635 charset_list = Vemacs_mule_charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9636 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9637 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9638 if (max_charset_id < XFASTINT (XCAR (tail)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9639 max_charset_id = XFASTINT (XCAR (tail));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9640 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9641 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9642 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9643 charset_list = Fcopy_sequence (charset_list);
91046
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9644 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9645 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9646 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9647
91046
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9648 val = XCAR (tail);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9649 CHECK_CHARSET_GET_CHARSET (val, charset);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9650 if (EQ (coding_type, Qiso_2022)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9651 ? CHARSET_ISO_FINAL (charset) < 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9652 : EQ (coding_type, Qemacs_mule)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9653 ? CHARSET_EMACS_MULE_ID (charset) < 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9654 : 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9655 error ("Can't handle charset `%s'",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9656 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9657
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9658 XSETCAR (tail, make_number (charset->id));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9659 if (max_charset_id < charset->id)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9660 max_charset_id = charset->id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9661 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9662 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9663 CODING_ATTR_CHARSET_LIST (attrs) = charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9664
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
9665 safe_charsets = make_uninit_string (max_charset_id + 1);
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
9666 memset (SDATA (safe_charsets), 255, max_charset_id + 1);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9667 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9668 SSET (safe_charsets, XFASTINT (XCAR (tail)), 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9669 CODING_ATTR_SAFE_CHARSETS (attrs) = safe_charsets;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9670
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9671 CODING_ATTR_ASCII_COMPAT (attrs) = args[coding_arg_ascii_compatible_p];
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9672
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9673 val = args[coding_arg_decode_translation_table];
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9674 if (! CHAR_TABLE_P (val) && ! CONSP (val))
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
9675 CHECK_SYMBOL (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9676 CODING_ATTR_DECODE_TBL (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9677
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9678 val = args[coding_arg_encode_translation_table];
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9679 if (! CHAR_TABLE_P (val) && ! CONSP (val))
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
9680 CHECK_SYMBOL (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9681 CODING_ATTR_ENCODE_TBL (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9682
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9683 val = args[coding_arg_post_read_conversion];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9684 CHECK_SYMBOL (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9685 CODING_ATTR_POST_READ (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9686
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9687 val = args[coding_arg_pre_write_conversion];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9688 CHECK_SYMBOL (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9689 CODING_ATTR_PRE_WRITE (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9690
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9691 val = args[coding_arg_default_char];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9692 if (NILP (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9693 CODING_ATTR_DEFAULT_CHAR (attrs) = make_number (' ');
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9694 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9695 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9696 CHECK_CHARACTER (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9697 CODING_ATTR_DEFAULT_CHAR (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9698 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9699
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9700 val = args[coding_arg_for_unibyte];
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9701 CODING_ATTR_FOR_UNIBYTE (attrs) = NILP (val) ? Qnil : Qt;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9702
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9703 val = args[coding_arg_plist];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9704 CHECK_LIST (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9705 CODING_ATTR_PLIST (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9706
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9707 if (EQ (coding_type, Qcharset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9708 {
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9709 /* Generate a lisp vector of 256 elements. Each element is nil,
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9710 integer, or a list of charset IDs.
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9711
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9712 If Nth element is nil, the byte code N is invalid in this
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9713 coding system.
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9714
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9715 If Nth element is a number NUM, N is the first byte of a
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9716 charset whose ID is NUM.
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9717
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9718 If Nth element is a list of charset IDs, N is the first byte
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9719 of one of them. The list is sorted by dimensions of the
110983
b87d8337c695 Fix typos in comments
Kenichi Handa <handa@m17n.org>
parents: 110847
diff changeset
9720 charsets. A charset of smaller dimension comes first. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9721 val = Fmake_vector (make_number (256), Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9722
89653
cbaa9fd1aa5c (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89648
diff changeset
9723 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9724 {
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9725 struct charset *charset = CHARSET_FROM_ID (XFASTINT (XCAR (tail)));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9726 int dim = CHARSET_DIMENSION (charset);
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9727 int idx = (dim - 1) * 4;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9728
89653
cbaa9fd1aa5c (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89648
diff changeset
9729 if (CHARSET_ASCII_COMPATIBLE_P (charset))
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9730 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9731
88477
5f974cbba7b3 (coding_set_source): Delete the local variable beg_byte.
Kenichi Handa <handa@m17n.org>
parents: 88473
diff changeset
9732 for (i = charset->code_space[idx];
5f974cbba7b3 (coding_set_source): Delete the local variable beg_byte.
Kenichi Handa <handa@m17n.org>
parents: 88473
diff changeset
9733 i <= charset->code_space[idx + 1]; i++)
5f974cbba7b3 (coding_set_source): Delete the local variable beg_byte.
Kenichi Handa <handa@m17n.org>
parents: 88473
diff changeset
9734 {
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9735 Lisp_Object tmp, tmp2;
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9736 int dim2;
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9737
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9738 tmp = AREF (val, i);
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9739 if (NILP (tmp))
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9740 tmp = XCAR (tail);
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9741 else if (NUMBERP (tmp))
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9742 {
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9743 dim2 = CHARSET_DIMENSION (CHARSET_FROM_ID (XFASTINT (tmp)));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9744 if (dim < dim2)
88607
18436bf3d6dd (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88598
diff changeset
9745 tmp = Fcons (XCAR (tail), Fcons (tmp, Qnil));
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9746 else
88607
18436bf3d6dd (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88598
diff changeset
9747 tmp = Fcons (tmp, Fcons (XCAR (tail), Qnil));
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9748 }
88477
5f974cbba7b3 (coding_set_source): Delete the local variable beg_byte.
Kenichi Handa <handa@m17n.org>
parents: 88473
diff changeset
9749 else
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9750 {
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9751 for (tmp2 = tmp; CONSP (tmp2); tmp2 = XCDR (tmp2))
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9752 {
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9753 dim2 = CHARSET_DIMENSION (CHARSET_FROM_ID (XFASTINT (XCAR (tmp2))));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9754 if (dim < dim2)
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9755 break;
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9756 }
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9757 if (NILP (tmp2))
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9758 tmp = nconc2 (tmp, Fcons (XCAR (tail), Qnil));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9759 else
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9760 {
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9761 XSETCDR (tmp2, Fcons (XCAR (tmp2), XCDR (tmp2)));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9762 XSETCAR (tmp2, XCAR (tail));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9763 }
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9764 }
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9765 ASET (val, i, tmp);
88477
5f974cbba7b3 (coding_set_source): Delete the local variable beg_byte.
Kenichi Handa <handa@m17n.org>
parents: 88473
diff changeset
9766 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9767 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9768 ASET (attrs, coding_attr_charset_valids, val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9769 category = coding_category_charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9770 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9771 else if (EQ (coding_type, Qccl))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9772 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9773 Lisp_Object valids;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9774
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9775 if (nargs < coding_arg_ccl_max)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9776 goto short_args;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9777
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9778 val = args[coding_arg_ccl_decoder];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9779 CHECK_CCL_PROGRAM (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9780 if (VECTORP (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9781 val = Fcopy_sequence (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9782 ASET (attrs, coding_attr_ccl_decoder, val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9783
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9784 val = args[coding_arg_ccl_encoder];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9785 CHECK_CCL_PROGRAM (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9786 if (VECTORP (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9787 val = Fcopy_sequence (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9788 ASET (attrs, coding_attr_ccl_encoder, val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9789
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9790 val = args[coding_arg_ccl_valids];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9791 valids = Fmake_string (make_number (256), make_number (0));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9792 for (tail = val; !NILP (tail); tail = Fcdr (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9793 {
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9794 int from, to;
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9795
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9796 val = Fcar (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9797 if (INTEGERP (val))
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9798 {
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9799 from = to = XINT (val);
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9800 if (from < 0 || from > 255)
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9801 args_out_of_range_3 (val, make_number (0), make_number (255));
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9802 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9803 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9804 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9805 CHECK_CONS (val);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9806 CHECK_NATNUM_CAR (val);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9807 CHECK_NATNUM_CDR (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9808 from = XINT (XCAR (val));
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9809 if (from > 255)
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9810 args_out_of_range_3 (XCAR (val),
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9811 make_number (0), make_number (255));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9812 to = XINT (XCDR (val));
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9813 if (to < from || to > 255)
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9814 args_out_of_range_3 (XCDR (val),
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9815 XCAR (val), make_number (255));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9816 }
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9817 for (i = from; i <= to; i++)
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9818 SSET (valids, i, 1);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9819 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9820 ASET (attrs, coding_attr_ccl_valids, valids);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9821
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9822 category = coding_category_ccl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9823 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9824 else if (EQ (coding_type, Qutf_16))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9825 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9826 Lisp_Object bom, endian;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9827
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9828 CODING_ATTR_ASCII_COMPAT (attrs) = Qnil;
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9829
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9830 if (nargs < coding_arg_utf16_max)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9831 goto short_args;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9832
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9833 bom = args[coding_arg_utf16_bom];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9834 if (! NILP (bom) && ! EQ (bom, Qt))
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
9835 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9836 CHECK_CONS (bom);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9837 val = XCAR (bom);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9838 CHECK_CODING_SYSTEM (val);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9839 val = XCDR (bom);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9840 CHECK_CODING_SYSTEM (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9841 }
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9842 ASET (attrs, coding_attr_utf_bom, bom);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9843
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9844 endian = args[coding_arg_utf16_endian];
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9845 CHECK_SYMBOL (endian);
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9846 if (NILP (endian))
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9847 endian = Qbig;
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9848 else if (! EQ (endian, Qbig) && ! EQ (endian, Qlittle))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9849 error ("Invalid endian: %s", SDATA (SYMBOL_NAME (endian)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9850 ASET (attrs, coding_attr_utf_16_endian, endian);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9851
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9852 category = (CONSP (bom)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9853 ? coding_category_utf_16_auto
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9854 : NILP (bom)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9855 ? (EQ (endian, Qbig)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9856 ? coding_category_utf_16_be_nosig
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9857 : coding_category_utf_16_le_nosig)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9858 : (EQ (endian, Qbig)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9859 ? coding_category_utf_16_be
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9860 : coding_category_utf_16_le));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9861 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9862 else if (EQ (coding_type, Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9863 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9864 Lisp_Object initial, reg_usage, request, flags;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
9865 int i;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9866
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9867 if (nargs < coding_arg_iso2022_max)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9868 goto short_args;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9869
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9870 initial = Fcopy_sequence (args[coding_arg_iso2022_initial]);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9871 CHECK_VECTOR (initial);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9872 for (i = 0; i < 4; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9873 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9874 val = Faref (initial, make_number (i));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9875 if (! NILP (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9876 {
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9877 struct charset *charset;
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9878
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9879 CHECK_CHARSET_GET_CHARSET (val, charset);
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9880 ASET (initial, i, make_number (CHARSET_ID (charset)));
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9881 if (i == 0 && CHARSET_ASCII_COMPATIBLE_P (charset))
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9882 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9883 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9884 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9885 ASET (initial, i, make_number (-1));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9886 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9887
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9888 reg_usage = args[coding_arg_iso2022_reg_usage];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9889 CHECK_CONS (reg_usage);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9890 CHECK_NUMBER_CAR (reg_usage);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9891 CHECK_NUMBER_CDR (reg_usage);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9892
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9893 request = Fcopy_sequence (args[coding_arg_iso2022_request]);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9894 for (tail = request; ! NILP (tail); tail = Fcdr (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9895 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9896 int id;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9897 Lisp_Object tmp;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9898
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9899 val = Fcar (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9900 CHECK_CONS (val);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9901 tmp = XCAR (val);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9902 CHECK_CHARSET_GET_ID (tmp, id);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9903 CHECK_NATNUM_CDR (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9904 if (XINT (XCDR (val)) >= 4)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9905 error ("Invalid graphic register number: %d", XINT (XCDR (val)));
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9906 XSETCAR (val, make_number (id));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9907 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9908
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9909 flags = args[coding_arg_iso2022_flags];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9910 CHECK_NATNUM (flags);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9911 i = XINT (flags);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9912 if (EQ (args[coding_arg_charset_list], Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9913 flags = make_number (i | CODING_ISO_FLAG_FULL_SUPPORT);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9914
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9915 ASET (attrs, coding_attr_iso_initial, initial);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9916 ASET (attrs, coding_attr_iso_usage, reg_usage);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9917 ASET (attrs, coding_attr_iso_request, request);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9918 ASET (attrs, coding_attr_iso_flags, flags);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9919 setup_iso_safe_charsets (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9920
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9921 if (i & CODING_ISO_FLAG_SEVEN_BITS)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9922 category = ((i & (CODING_ISO_FLAG_LOCKING_SHIFT
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9923 | CODING_ISO_FLAG_SINGLE_SHIFT))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9924 ? coding_category_iso_7_else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9925 : EQ (args[coding_arg_charset_list], Qiso_2022)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9926 ? coding_category_iso_7
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9927 : coding_category_iso_7_tight);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9928 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9929 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9930 int id = XINT (AREF (initial, 1));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9931
88977
3b05c02eebf2 (Fdefine_coding_system_internal): Fix category setting
Kenichi Handa <handa@m17n.org>
parents: 88950
diff changeset
9932 category = (((i & CODING_ISO_FLAG_LOCKING_SHIFT)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9933 || EQ (args[coding_arg_charset_list], Qiso_2022)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9934 || id < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9935 ? coding_category_iso_8_else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9936 : (CHARSET_DIMENSION (CHARSET_FROM_ID (id)) == 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9937 ? coding_category_iso_8_1
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9938 : coding_category_iso_8_2);
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
9939 }
89227
101ee928c088 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89225
diff changeset
9940 if (category != coding_category_iso_8_1
101ee928c088 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89225
diff changeset
9941 && category != coding_category_iso_8_2)
101ee928c088 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89225
diff changeset
9942 CODING_ATTR_ASCII_COMPAT (attrs) = Qnil;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9943 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9944 else if (EQ (coding_type, Qemacs_mule))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9945 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9946 if (EQ (args[coding_arg_charset_list], Qemacs_mule))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9947 ASET (attrs, coding_attr_emacs_mule_full, Qt);
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9948 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9949 category = coding_category_emacs_mule;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9950 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9951 else if (EQ (coding_type, Qshift_jis))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9952 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9953
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9954 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9955
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
9956 if (XINT (Flength (charset_list)) != 3
89739
293c9235be3f (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89732
diff changeset
9957 && XINT (Flength (charset_list)) != 4)
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
9958 error ("There should be three or four charsets");
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9959
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9960 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9961 if (CHARSET_DIMENSION (charset) != 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9962 error ("Dimension of charset %s is not one",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9963 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9964 if (CHARSET_ASCII_COMPATIBLE_P (charset))
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9965 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9966
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9967 charset_list = XCDR (charset_list);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9968 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9969 if (CHARSET_DIMENSION (charset) != 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9970 error ("Dimension of charset %s is not one",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9971 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9972
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9973 charset_list = XCDR (charset_list);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9974 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9975 if (CHARSET_DIMENSION (charset) != 2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9976 error ("Dimension of charset %s is not two",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9977 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9978
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
9979 charset_list = XCDR (charset_list);
89740
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
9980 if (! NILP (charset_list))
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
9981 {
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
9982 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
9983 if (CHARSET_DIMENSION (charset) != 2)
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
9984 error ("Dimension of charset %s is not two",
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
9985 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
9986 }
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
9987
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9988 category = coding_category_sjis;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9989 Vsjis_coding_system = name;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9990 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9991 else if (EQ (coding_type, Qbig5))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9992 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9993 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9994
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9995 if (XINT (Flength (charset_list)) != 2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9996 error ("There should be just two charsets");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9997
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9998 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9999 if (CHARSET_DIMENSION (charset) != 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10000 error ("Dimension of charset %s is not one",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10001 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10002 if (CHARSET_ASCII_COMPATIBLE_P (charset))
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10003 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10004
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10005 charset_list = XCDR (charset_list);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10006 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10007 if (CHARSET_DIMENSION (charset) != 2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10008 error ("Dimension of charset %s is not two",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10009 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10010
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10011 category = coding_category_big5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10012 Vbig5_coding_system = name;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10013 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10014 else if (EQ (coding_type, Qraw_text))
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10015 {
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10016 category = coding_category_raw_text;
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10017 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10018 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10019 else if (EQ (coding_type, Qutf_8))
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10020 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10021 Lisp_Object bom;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10022
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10023 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10024
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10025 if (nargs < coding_arg_utf8_max)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10026 goto short_args;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10027
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10028 bom = args[coding_arg_utf8_bom];
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10029 if (! NILP (bom) && ! EQ (bom, Qt))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10030 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10031 CHECK_CONS (bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10032 val = XCAR (bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10033 CHECK_CODING_SYSTEM (val);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10034 val = XCDR (bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10035 CHECK_CODING_SYSTEM (val);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10036 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10037 ASET (attrs, coding_attr_utf_bom, bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10038
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10039 category = (CONSP (bom) ? coding_category_utf_8_auto
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10040 : NILP (bom) ? coding_category_utf_8_nosig
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10041 : coding_category_utf_8_sig);
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10042 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10043 else if (EQ (coding_type, Qundecided))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10044 category = coding_category_undecided;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10045 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10046 error ("Invalid coding system type: %s",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10047 SDATA (SYMBOL_NAME (coding_type)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10048
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10049 CODING_ATTR_CATEGORY (attrs) = make_number (category);
89468
7dbbe692f70c * coding.c (QCcategory): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89467
diff changeset
10050 CODING_ATTR_PLIST (attrs)
7dbbe692f70c * coding.c (QCcategory): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89467
diff changeset
10051 = Fcons (QCcategory, Fcons (AREF (Vcoding_category_table, category),
7dbbe692f70c * coding.c (QCcategory): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89467
diff changeset
10052 CODING_ATTR_PLIST (attrs)));
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10053 CODING_ATTR_PLIST (attrs)
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
10054 = Fcons (QCascii_compatible_p,
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10055 Fcons (CODING_ATTR_ASCII_COMPAT (attrs),
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10056 CODING_ATTR_PLIST (attrs)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10057
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10058 eol_type = args[coding_arg_eol_type];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10059 if (! NILP (eol_type)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10060 && ! EQ (eol_type, Qunix)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10061 && ! EQ (eol_type, Qdos)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10062 && ! EQ (eol_type, Qmac))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10063 error ("Invalid eol-type");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10064
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10065 aliases = Fcons (name, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10066
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10067 if (NILP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10068 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10069 eol_type = make_subsidiaries (name);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10070 for (i = 0; i < 3; i++)
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
10071 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10072 Lisp_Object this_spec, this_name, this_aliases, this_eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10073
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10074 this_name = AREF (eol_type, i);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10075 this_aliases = Fcons (this_name, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10076 this_eol_type = (i == 0 ? Qunix : i == 1 ? Qdos : Qmac);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10077 this_spec = Fmake_vector (make_number (3), attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10078 ASET (this_spec, 1, this_aliases);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10079 ASET (this_spec, 2, this_eol_type);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10080 Fputhash (this_name, this_spec, Vcoding_system_hash_table);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10081 Vcoding_system_list = Fcons (this_name, Vcoding_system_list);
90289
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10082 val = Fassoc (Fsymbol_name (this_name), Vcoding_system_alist);
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10083 if (NILP (val))
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10084 Vcoding_system_alist
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10085 = Fcons (Fcons (Fsymbol_name (this_name), Qnil),
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10086 Vcoding_system_alist);
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
10087 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10088 }
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
10089
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10090 spec_vec = Fmake_vector (make_number (3), attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10091 ASET (spec_vec, 1, aliases);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10092 ASET (spec_vec, 2, eol_type);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10093
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10094 Fputhash (name, spec_vec, Vcoding_system_hash_table);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10095 Vcoding_system_list = Fcons (name, Vcoding_system_list);
90289
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10096 val = Fassoc (Fsymbol_name (name), Vcoding_system_alist);
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10097 if (NILP (val))
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10098 Vcoding_system_alist = Fcons (Fcons (Fsymbol_name (name), Qnil),
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10099 Vcoding_system_alist);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10100
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10101 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10102 int id = coding_categories[category].id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10103
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10104 if (id < 0 || EQ (name, CODING_ID_NAME (id)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10105 setup_coding_system (name, &coding_categories[category]);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10106 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10107
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10108 return Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10109
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10110 short_args:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10111 return Fsignal (Qwrong_number_of_arguments,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10112 Fcons (intern ("define-coding-system-internal"),
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10113 make_number (nargs)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10114 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10115
89571
242f2cc0134b (Fdefine_coding_system_alias): Update Vcoding_system_list.
Kenichi Handa <handa@m17n.org>
parents: 89562
diff changeset
10116
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10117 DEFUN ("coding-system-put", Fcoding_system_put, Scoding_system_put,
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10118 3, 3, 0,
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10119 doc: /* Change value in CODING-SYSTEM's property list PROP to VAL. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
10120 (Lisp_Object coding_system, Lisp_Object prop, Lisp_Object val)
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10121 {
89924
7d0f6da3ea6e (detect_coding): Delete unused variables.
Kenichi Handa <handa@m17n.org>
parents: 89917
diff changeset
10122 Lisp_Object spec, attrs;
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10123
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10124 CHECK_CODING_SYSTEM_GET_SPEC (coding_system, spec);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10125 attrs = AREF (spec, 0);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10126 if (EQ (prop, QCmnemonic))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10127 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10128 if (! STRINGP (val))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10129 CHECK_CHARACTER (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10130 CODING_ATTR_MNEMONIC (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10131 }
100303
3e044fa54e4f * coding.c (QCdefault_char): Rename from QCdefalut_char.
Juanma Barranquero <lekktu@gmail.com>
parents: 100262
diff changeset
10132 else if (EQ (prop, QCdefault_char))
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10133 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10134 if (NILP (val))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10135 val = make_number (' ');
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10136 else
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10137 CHECK_CHARACTER (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10138 CODING_ATTR_DEFAULT_CHAR (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10139 }
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10140 else if (EQ (prop, QCdecode_translation_table))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10141 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10142 if (! CHAR_TABLE_P (val) && ! CONSP (val))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10143 CHECK_SYMBOL (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10144 CODING_ATTR_DECODE_TBL (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10145 }
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10146 else if (EQ (prop, QCencode_translation_table))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10147 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10148 if (! CHAR_TABLE_P (val) && ! CONSP (val))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10149 CHECK_SYMBOL (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10150 CODING_ATTR_ENCODE_TBL (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10151 }
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10152 else if (EQ (prop, QCpost_read_conversion))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10153 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10154 CHECK_SYMBOL (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10155 CODING_ATTR_POST_READ (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10156 }
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10157 else if (EQ (prop, QCpre_write_conversion))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10158 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10159 CHECK_SYMBOL (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10160 CODING_ATTR_PRE_WRITE (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10161 }
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10162 else if (EQ (prop, QCascii_compatible_p))
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10163 {
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10164 CODING_ATTR_ASCII_COMPAT (attrs) = val;
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10165 }
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10166
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10167 CODING_ATTR_PLIST (attrs)
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10168 = Fplist_put (CODING_ATTR_PLIST (attrs), prop, val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10169 return val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10170 }
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10171
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10172
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10173 DEFUN ("define-coding-system-alias", Fdefine_coding_system_alias,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10174 Sdefine_coding_system_alias, 2, 2, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10175 doc: /* Define ALIAS as an alias for CODING-SYSTEM. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
10176 (Lisp_Object alias, Lisp_Object coding_system)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10177 {
90289
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10178 Lisp_Object spec, aliases, eol_type, val;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10179
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10180 CHECK_SYMBOL (alias);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10181 CHECK_CODING_SYSTEM_GET_SPEC (coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10182 aliases = AREF (spec, 1);
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
10183 /* ALIASES should be a list of length more than zero, and the first
89571
242f2cc0134b (Fdefine_coding_system_alias): Update Vcoding_system_list.
Kenichi Handa <handa@m17n.org>
parents: 89562
diff changeset
10184 element is a base coding system. Append ALIAS at the tail of the
242f2cc0134b (Fdefine_coding_system_alias): Update Vcoding_system_list.
Kenichi Handa <handa@m17n.org>
parents: 89562
diff changeset
10185 list. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10186 while (!NILP (XCDR (aliases)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10187 aliases = XCDR (aliases);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10188 XSETCDR (aliases, Fcons (alias, Qnil));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10189
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10190 eol_type = AREF (spec, 2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10191 if (VECTORP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10192 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10193 Lisp_Object subsidiaries;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10194 int i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10195
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10196 subsidiaries = make_subsidiaries (alias);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10197 for (i = 0; i < 3; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10198 Fdefine_coding_system_alias (AREF (subsidiaries, i),
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10199 AREF (eol_type, i));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10200 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10201
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10202 Fputhash (alias, spec, Vcoding_system_hash_table);
89571
242f2cc0134b (Fdefine_coding_system_alias): Update Vcoding_system_list.
Kenichi Handa <handa@m17n.org>
parents: 89562
diff changeset
10203 Vcoding_system_list = Fcons (alias, Vcoding_system_list);
90289
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10204 val = Fassoc (Fsymbol_name (alias), Vcoding_system_alist);
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10205 if (NILP (val))
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10206 Vcoding_system_alist = Fcons (Fcons (Fsymbol_name (alias), Qnil),
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10207 Vcoding_system_alist);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10208
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10209 return Qnil;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10210 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10211
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10212 DEFUN ("coding-system-base", Fcoding_system_base, Scoding_system_base,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10213 1, 1, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10214 doc: /* Return the base of CODING-SYSTEM.
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
10215 Any alias or subsidiary coding system is not a base coding system. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
10216 (Lisp_Object coding_system)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10217 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10218 Lisp_Object spec, attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10219
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10220 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10221 return (Qno_conversion);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10222 CHECK_CODING_SYSTEM_GET_SPEC (coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10223 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10224 return CODING_ATTR_BASE_NAME (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10225 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10226
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10227 DEFUN ("coding-system-plist", Fcoding_system_plist, Scoding_system_plist,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10228 1, 1, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10229 doc: /* Return the property list of CODING-SYSTEM. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
10230 (Lisp_Object coding_system)
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10231 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10232 Lisp_Object spec, attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10233
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10234 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10235 coding_system = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10236 CHECK_CODING_SYSTEM_GET_SPEC (coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10237 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10238 return CODING_ATTR_PLIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10239 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10240
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10241
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10242 DEFUN ("coding-system-aliases", Fcoding_system_aliases, Scoding_system_aliases,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10243 1, 1, 0,
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
10244 doc: /* Return the list of aliases of CODING-SYSTEM. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
10245 (Lisp_Object coding_system)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10246 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10247 Lisp_Object spec;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10248
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10249 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10250 coding_system = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10251 CHECK_CODING_SYSTEM_GET_SPEC (coding_system, spec);
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
10252 return AREF (spec, 1);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10253 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10254
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10255 DEFUN ("coding-system-eol-type", Fcoding_system_eol_type,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10256 Scoding_system_eol_type, 1, 1, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10257 doc: /* Return eol-type of CODING-SYSTEM.
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
10258 An eol-type is an integer 0, 1, 2, or a vector of coding systems.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10259
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10260 Integer values 0, 1, and 2 indicate a format of end-of-line; LF, CRLF,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10261 and CR respectively.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10262
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10263 A vector value indicates that a format of end-of-line should be
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10264 detected automatically. Nth element of the vector is the subsidiary
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10265 coding system whose eol-type is N. */)
109179
8cfee7d2955f Convert DEFUNs to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109165
diff changeset
10266 (Lisp_Object coding_system)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10267 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10268 Lisp_Object spec, eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10269 int n;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10270
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10271 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10272 coding_system = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10273 if (! CODING_SYSTEM_P (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10274 return Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10275 spec = CODING_SYSTEM_SPEC (coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10276 eol_type = AREF (spec, 2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10277 if (VECTORP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10278 return Fcopy_sequence (eol_type);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10279 n = EQ (eol_type, Qunix) ? 0 : EQ (eol_type, Qdos) ? 1 : 2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10280 return make_number (n);
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10281 }
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10282
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10283 #endif /* emacs */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10284
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10285
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
10286 /*** 9. Post-amble ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10287
21514
fa9ff387d260 Fix -Wimplicit warnings.
Andreas Schwab <schwab@suse.de>
parents: 21505
diff changeset
10288 void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
10289 init_coding_once (void)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10290 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10291 int i;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10292
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10293 for (i = 0; i < coding_category_max; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10294 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10295 coding_categories[i].id = -1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10296 coding_priorities[i] = i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10297 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10298
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10299 /* ISO2022 specific initialize routine. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10300 for (i = 0; i < 0x20; i++)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
10301 iso_code_class[i] = ISO_control_0;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10302 for (i = 0x21; i < 0x7F; i++)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10303 iso_code_class[i] = ISO_graphic_plane_0;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10304 for (i = 0x80; i < 0xA0; i++)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
10305 iso_code_class[i] = ISO_control_1;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10306 for (i = 0xA1; i < 0xFF; i++)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10307 iso_code_class[i] = ISO_graphic_plane_1;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10308 iso_code_class[0x20] = iso_code_class[0x7F] = ISO_0x20_or_0x7F;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10309 iso_code_class[0xA0] = iso_code_class[0xFF] = ISO_0xA0_or_0xFF;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10310 iso_code_class[ISO_CODE_SO] = ISO_shift_out;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10311 iso_code_class[ISO_CODE_SI] = ISO_shift_in;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10312 iso_code_class[ISO_CODE_SS2_7] = ISO_single_shift_2_7;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10313 iso_code_class[ISO_CODE_ESC] = ISO_escape;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10314 iso_code_class[ISO_CODE_SS2] = ISO_single_shift_2;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10315 iso_code_class[ISO_CODE_SS3] = ISO_single_shift_3;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10316 iso_code_class[ISO_CODE_CSI] = ISO_control_sequence_introducer;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10317
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10318 for (i = 0; i < 256; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10319 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10320 emacs_mule_bytes[i] = 1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10321 }
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
10322 emacs_mule_bytes[EMACS_MULE_LEADING_CODE_PRIVATE_11] = 3;
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
10323 emacs_mule_bytes[EMACS_MULE_LEADING_CODE_PRIVATE_12] = 3;
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
10324 emacs_mule_bytes[EMACS_MULE_LEADING_CODE_PRIVATE_21] = 4;
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
10325 emacs_mule_bytes[EMACS_MULE_LEADING_CODE_PRIVATE_22] = 4;
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10326 }
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10327
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10328 #ifdef emacs
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10329
21514
fa9ff387d260 Fix -Wimplicit warnings.
Andreas Schwab <schwab@suse.de>
parents: 21505
diff changeset
10330 void
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
10331 syms_of_coding (void)
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10332 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10333 staticpro (&Vcoding_system_hash_table);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10334 {
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10335 Lisp_Object args[2];
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10336 args[0] = QCtest;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10337 args[1] = Qeq;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10338 Vcoding_system_hash_table = Fmake_hash_table (2, args);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10339 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10340
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10341 staticpro (&Vsjis_coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10342 Vsjis_coding_system = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10343
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10344 staticpro (&Vbig5_coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10345 Vbig5_coding_system = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10346
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
10347 staticpro (&Vcode_conversion_reused_workbuf);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
10348 Vcode_conversion_reused_workbuf = Qnil;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
10349
58637
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
10350 staticpro (&Vcode_conversion_workbuf_name);
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10351 Vcode_conversion_workbuf_name = make_pure_c_string (" *code-conversion-work*");
58637
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
10352
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
10353 reused_workbuf_in_use = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10354
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10355 DEFSYM (Qcharset, "charset");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10356 DEFSYM (Qtarget_idx, "target-idx");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10357 DEFSYM (Qcoding_system_history, "coding-system-history");
19750
95e4e1cba6ac (Qcoding_system_history): New variable.
Richard M. Stallman <rms@gnu.org>
parents: 19747
diff changeset
10358 Fset (Qcoding_system_history, Qnil);
95e4e1cba6ac (Qcoding_system_history): New variable.
Richard M. Stallman <rms@gnu.org>
parents: 19747
diff changeset
10359
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10360 /* Target FILENAME is the first argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10361 Fput (Qinsert_file_contents, Qtarget_idx, make_number (0));
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10362 /* Target FILENAME is the third argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10363 Fput (Qwrite_region, Qtarget_idx, make_number (2));
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10364
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10365 DEFSYM (Qcall_process, "call-process");
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10366 /* Target PROGRAM is the first argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10367 Fput (Qcall_process, Qtarget_idx, make_number (0));
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10368
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10369 DEFSYM (Qcall_process_region, "call-process-region");
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10370 /* Target PROGRAM is the third argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10371 Fput (Qcall_process_region, Qtarget_idx, make_number (2));
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10372
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10373 DEFSYM (Qstart_process, "start-process");
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10374 /* Target PROGRAM is the third argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10375 Fput (Qstart_process, Qtarget_idx, make_number (2));
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10376
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10377 DEFSYM (Qopen_network_stream, "open-network-stream");
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10378 /* Target SERVICE is the fourth argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10379 Fput (Qopen_network_stream, Qtarget_idx, make_number (3));
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10380
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10381 DEFSYM (Qcoding_system, "coding-system");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10382 DEFSYM (Qcoding_aliases, "coding-aliases");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10383
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10384 DEFSYM (Qeol_type, "eol-type");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10385 DEFSYM (Qunix, "unix");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10386 DEFSYM (Qdos, "dos");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10387
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10388 DEFSYM (Qbuffer_file_coding_system, "buffer-file-coding-system");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10389 DEFSYM (Qpost_read_conversion, "post-read-conversion");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10390 DEFSYM (Qpre_write_conversion, "pre-write-conversion");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10391 DEFSYM (Qdefault_char, "default-char");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10392 DEFSYM (Qundecided, "undecided");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10393 DEFSYM (Qno_conversion, "no-conversion");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10394 DEFSYM (Qraw_text, "raw-text");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10395
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10396 DEFSYM (Qiso_2022, "iso-2022");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10397
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10398 DEFSYM (Qutf_8, "utf-8");
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10399 DEFSYM (Qutf_8_emacs, "utf-8-emacs");
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10400
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10401 DEFSYM (Qutf_16, "utf-16");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10402 DEFSYM (Qbig, "big");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10403 DEFSYM (Qlittle, "little");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10404
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10405 DEFSYM (Qshift_jis, "shift-jis");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10406 DEFSYM (Qbig5, "big5");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10407
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10408 DEFSYM (Qcoding_system_p, "coding-system-p");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10409
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10410 DEFSYM (Qcoding_system_error, "coding-system-error");
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10411 Fput (Qcoding_system_error, Qerror_conditions,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10412 pure_cons (Qcoding_system_error, pure_cons (Qerror, Qnil)));
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10413 Fput (Qcoding_system_error, Qerror_message,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10414 make_pure_c_string ("Invalid coding system"));
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10415
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
10416 /* Intern this now in case it isn't already done.
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
10417 Setting this variable twice is harmless.
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
10418 But don't staticpro it here--that is done in alloc.c. */
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10419 Qchar_table_extra_slots = intern_c_string ("char-table-extra-slots");
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10420
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10421 DEFSYM (Qtranslation_table, "translation-table");
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
10422 Fput (Qtranslation_table, Qchar_table_extra_slots, make_number (2));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10423 DEFSYM (Qtranslation_table_id, "translation-table-id");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10424 DEFSYM (Qtranslation_table_for_decode, "translation-table-for-decode");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10425 DEFSYM (Qtranslation_table_for_encode, "translation-table-for-encode");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10426
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10427 DEFSYM (Qvalid_codes, "valid-codes");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10428
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10429 DEFSYM (Qemacs_mule, "emacs-mule");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10430
89468
7dbbe692f70c * coding.c (QCcategory): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89467
diff changeset
10431 DEFSYM (QCcategory, ":category");
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10432 DEFSYM (QCmnemonic, ":mnemonic");
100303
3e044fa54e4f * coding.c (QCdefault_char): Rename from QCdefalut_char.
Juanma Barranquero <lekktu@gmail.com>
parents: 100262
diff changeset
10433 DEFSYM (QCdefault_char, ":default-char");
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10434 DEFSYM (QCdecode_translation_table, ":decode-translation-table");
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10435 DEFSYM (QCencode_translation_table, ":encode-translation-table");
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10436 DEFSYM (QCpost_read_conversion, ":post-read-conversion");
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10437 DEFSYM (QCpre_write_conversion, ":pre-write-conversion");
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10438 DEFSYM (QCascii_compatible_p, ":ascii-compatible-p");
89468
7dbbe692f70c * coding.c (QCcategory): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89467
diff changeset
10439
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10440 Vcoding_category_table
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10441 = Fmake_vector (make_number (coding_category_max), Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10442 staticpro (&Vcoding_category_table);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10443 /* The following are targets of code detection. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10444 ASET (Vcoding_category_table, coding_category_iso_7,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10445 intern_c_string ("coding-category-iso-7"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10446 ASET (Vcoding_category_table, coding_category_iso_7_tight,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10447 intern_c_string ("coding-category-iso-7-tight"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10448 ASET (Vcoding_category_table, coding_category_iso_8_1,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10449 intern_c_string ("coding-category-iso-8-1"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10450 ASET (Vcoding_category_table, coding_category_iso_8_2,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10451 intern_c_string ("coding-category-iso-8-2"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10452 ASET (Vcoding_category_table, coding_category_iso_7_else,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10453 intern_c_string ("coding-category-iso-7-else"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10454 ASET (Vcoding_category_table, coding_category_iso_8_else,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10455 intern_c_string ("coding-category-iso-8-else"));
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10456 ASET (Vcoding_category_table, coding_category_utf_8_auto,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10457 intern_c_string ("coding-category-utf-8-auto"));
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10458 ASET (Vcoding_category_table, coding_category_utf_8_nosig,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10459 intern_c_string ("coding-category-utf-8"));
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10460 ASET (Vcoding_category_table, coding_category_utf_8_sig,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10461 intern_c_string ("coding-category-utf-8-sig"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10462 ASET (Vcoding_category_table, coding_category_utf_16_be,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10463 intern_c_string ("coding-category-utf-16-be"));
89467
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10464 ASET (Vcoding_category_table, coding_category_utf_16_auto,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10465 intern_c_string ("coding-category-utf-16-auto"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10466 ASET (Vcoding_category_table, coding_category_utf_16_le,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10467 intern_c_string ("coding-category-utf-16-le"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10468 ASET (Vcoding_category_table, coding_category_utf_16_be_nosig,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10469 intern_c_string ("coding-category-utf-16-be-nosig"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10470 ASET (Vcoding_category_table, coding_category_utf_16_le_nosig,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10471 intern_c_string ("coding-category-utf-16-le-nosig"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10472 ASET (Vcoding_category_table, coding_category_charset,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10473 intern_c_string ("coding-category-charset"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10474 ASET (Vcoding_category_table, coding_category_sjis,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10475 intern_c_string ("coding-category-sjis"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10476 ASET (Vcoding_category_table, coding_category_big5,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10477 intern_c_string ("coding-category-big5"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10478 ASET (Vcoding_category_table, coding_category_ccl,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10479 intern_c_string ("coding-category-ccl"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10480 ASET (Vcoding_category_table, coding_category_emacs_mule,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10481 intern_c_string ("coding-category-emacs-mule"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10482 /* The following are NOT targets of code detection. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10483 ASET (Vcoding_category_table, coding_category_raw_text,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10484 intern_c_string ("coding-category-raw-text"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10485 ASET (Vcoding_category_table, coding_category_undecided,
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10486 intern_c_string ("coding-category-undecided"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10487
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10488 DEFSYM (Qinsufficient_source, "insufficient-source");
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10489 DEFSYM (Qinconsistent_eol, "inconsistent-eol");
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10490 DEFSYM (Qinvalid_source, "invalid-source");
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10491 DEFSYM (Qinterrupted, "interrupted");
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10492 DEFSYM (Qinsufficient_memory, "insufficient-memory");
90272
f1df126ec7de Sync to HEAD for handling autoload-coding-system.
Kenichi Handa <handa@m17n.org>
parents: 90263
diff changeset
10493 DEFSYM (Qcoding_system_define_form, "coding-system-define-form");
52794
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
10494
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10495 defsubr (&Scoding_system_p);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10496 defsubr (&Sread_coding_system);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10497 defsubr (&Sread_non_nil_coding_system);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10498 defsubr (&Scheck_coding_system);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10499 defsubr (&Sdetect_coding_region);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10500 defsubr (&Sdetect_coding_string);
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
10501 defsubr (&Sfind_coding_systems_region_internal);
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
10502 defsubr (&Sunencodable_char_position);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10503 defsubr (&Scheck_coding_systems_region);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10504 defsubr (&Sdecode_coding_region);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10505 defsubr (&Sencode_coding_region);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10506 defsubr (&Sdecode_coding_string);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10507 defsubr (&Sencode_coding_string);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10508 defsubr (&Sdecode_sjis_char);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10509 defsubr (&Sencode_sjis_char);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10510 defsubr (&Sdecode_big5_char);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10511 defsubr (&Sencode_big5_char);
18002
a14261786239 (encode_invocation_designation): Use macro
Kenichi Handa <handa@m17n.org>
parents: 17835
diff changeset
10512 defsubr (&Sset_terminal_coding_system_internal);
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
10513 defsubr (&Sset_safe_terminal_coding_system_internal);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10514 defsubr (&Sterminal_coding_system);
18002
a14261786239 (encode_invocation_designation): Use macro
Kenichi Handa <handa@m17n.org>
parents: 17835
diff changeset
10515 defsubr (&Sset_keyboard_coding_system_internal);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10516 defsubr (&Skeyboard_coding_system);
18536
69c0e220b626 (Vstandard_character_unification_table_for_decode):
Kenichi Handa <handa@m17n.org>
parents: 18523
diff changeset
10517 defsubr (&Sfind_operation_coding_system);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10518 defsubr (&Sset_coding_system_priority);
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10519 defsubr (&Sdefine_coding_system_internal);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10520 defsubr (&Sdefine_coding_system_alias);
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10521 defsubr (&Scoding_system_put);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10522 defsubr (&Scoding_system_base);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10523 defsubr (&Scoding_system_plist);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10524 defsubr (&Scoding_system_aliases);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10525 defsubr (&Scoding_system_eol_type);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10526 defsubr (&Scoding_system_priority_list);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10527
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10528 DEFVAR_LISP ("coding-system-list", &Vcoding_system_list,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10529 doc: /* List of coding systems.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10530
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10531 Do not alter the value of this variable manually. This variable should be
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10532 updated by the functions `define-coding-system' and
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10533 `define-coding-system-alias'. */);
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10534 Vcoding_system_list = Qnil;
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10535
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10536 DEFVAR_LISP ("coding-system-alist", &Vcoding_system_alist,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10537 doc: /* Alist of coding system names.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10538 Each element is a one-element list containing a coding system name.
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10539 This variable is given to `completing-read' as COLLECTION argument.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10540
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10541 Do not alter the value of this variable manually. This variable should be
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10542 updated by the functions `define-coding-system' and
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10543 `define-coding-system-alias'. */);
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10544 Vcoding_system_alist = Qnil;
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10545
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10546 DEFVAR_LISP ("coding-category-list", &Vcoding_category_list,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10547 doc: /* List of coding-categories (symbols) ordered by priority.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10548
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10549 On detecting a coding system, Emacs tries code detection algorithms
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10550 associated with each coding-category one by one in this order. When
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10551 one algorithm agrees with a byte sequence of source text, the coding
60608
4b80e9c28e8f (syms_of_coding): Docstring of coding-category-list fixed.
Kenichi Handa <handa@m17n.org>
parents: 60031
diff changeset
10552 system bound to the corresponding coding-category is selected.
4b80e9c28e8f (syms_of_coding): Docstring of coding-category-list fixed.
Kenichi Handa <handa@m17n.org>
parents: 60031
diff changeset
10553
111402
435e622dd41e Refer to set-coding-system-priority instead of the obsolete
Lars Magne Ingebrigtsen <larsi@gnus.org>
parents: 111237
diff changeset
10554 Don't modify this variable directly, but use `set-coding-system-priority'. */);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10555 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10556 int i;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10557
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10558 Vcoding_category_list = Qnil;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10559 for (i = coding_category_max - 1; i >= 0; i--)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10560 Vcoding_category_list
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10561 = Fcons (XVECTOR (Vcoding_category_table)->contents[i],
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10562 Vcoding_category_list);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10563 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10564
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10565 DEFVAR_LISP ("coding-system-for-read", &Vcoding_system_for_read,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10566 doc: /* Specify the coding system for read operations.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10567 It is useful to bind this variable with `let', but do not set it globally.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10568 If the value is a coding system, it is used for decoding on read operation.
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10569 If not, an appropriate element is used from one of the coding system alists.
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10570 There are three such tables: `file-coding-system-alist',
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10571 `process-coding-system-alist', and `network-coding-system-alist'. */);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10572 Vcoding_system_for_read = Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10573
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10574 DEFVAR_LISP ("coding-system-for-write", &Vcoding_system_for_write,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10575 doc: /* Specify the coding system for write operations.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10576 Programs bind this variable with `let', but you should not set it globally.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10577 If the value is a coding system, it is used for encoding of output,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10578 when writing it to a file and when sending it to a file or subprocess.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10579
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10580 If this does not specify a coding system, an appropriate element
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10581 is used from one of the coding system alists.
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10582 There are three such tables: `file-coding-system-alist',
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10583 `process-coding-system-alist', and `network-coding-system-alist'.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10584 For output to files, if the above procedure does not specify a coding system,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10585 the value of `buffer-file-coding-system' is used. */);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10586 Vcoding_system_for_write = Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10587
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10588 DEFVAR_LISP ("last-coding-system-used", &Vlast_coding_system_used,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10589 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10590 Coding system used in the latest file or process I/O. */);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10591 Vlast_coding_system_used = Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10592
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10593 DEFVAR_LISP ("last-code-conversion-error", &Vlast_code_conversion_error,
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10594 doc: /*
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10595 Error status of the last code conversion.
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10596
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10597 When an error was detected in the last code conversion, this variable
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10598 is set to one of the following symbols.
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10599 `insufficient-source'
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10600 `inconsistent-eol'
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10601 `invalid-source'
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10602 `interrupted'
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10603 `insufficient-memory'
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10604 When no error was detected, the value doesn't change. So, to check
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10605 the error status of a code conversion by this variable, you must
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10606 explicitly set this variable to nil before performing code
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10607 conversion. */);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10608 Vlast_code_conversion_error = Qnil;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10609
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10610 DEFVAR_BOOL ("inhibit-eol-conversion", &inhibit_eol_conversion,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10611 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10612 *Non-nil means always inhibit code conversion of end-of-line format.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10613 See info node `Coding Systems' and info node `Text and Binary' concerning
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10614 such conversion. */);
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10615 inhibit_eol_conversion = 0;
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10616
21574
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
10617 DEFVAR_BOOL ("inherit-process-coding-system", &inherit_process_coding_system,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10618 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10619 Non-nil means process buffer inherits coding system of process output.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10620 Bind it to t if the process output is to be treated as if it were a file
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10621 read from some filesystem. */);
21574
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
10622 inherit_process_coding_system = 0;
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
10623
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10624 DEFVAR_LISP ("file-coding-system-alist", &Vfile_coding_system_alist,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10625 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10626 Alist to decide a coding system to use for a file I/O operation.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10627 The format is ((PATTERN . VAL) ...),
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10628 where PATTERN is a regular expression matching a file name,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10629 VAL is a coding system, a cons of coding systems, or a function symbol.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10630 If VAL is a coding system, it is used for both decoding and encoding
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10631 the file contents.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10632 If VAL is a cons of coding systems, the car part is used for decoding,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10633 and the cdr part is used for encoding.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10634 If VAL is a function symbol, the function must return a coding system
72323
af796bc81ff0 (syms_of_coding): Improve the docstring
Kenichi Handa <handa@m17n.org>
parents: 72188
diff changeset
10635 or a cons of coding systems which are used as above. The function is
af796bc81ff0 (syms_of_coding): Improve the docstring
Kenichi Handa <handa@m17n.org>
parents: 72188
diff changeset
10636 called with an argument that is a list of the arguments with which
81611
ae42ad5f89e6 (Ffind_operation_coding_system): Docstring improved.
Kenichi Handa <handa@m17n.org>
parents: 75348
diff changeset
10637 `find-operation-coding-system' was called. If the function can't decide
ae42ad5f89e6 (Ffind_operation_coding_system): Docstring improved.
Kenichi Handa <handa@m17n.org>
parents: 75348
diff changeset
10638 a coding system, it can return `undecided' so that the normal
ae42ad5f89e6 (Ffind_operation_coding_system): Docstring improved.
Kenichi Handa <handa@m17n.org>
parents: 75348
diff changeset
10639 code-detection is performed.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10640
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10641 See also the function `find-operation-coding-system'
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10642 and the variable `auto-coding-alist'. */);
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10643 Vfile_coding_system_alist = Qnil;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10644
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10645 DEFVAR_LISP ("process-coding-system-alist", &Vprocess_coding_system_alist,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10646 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10647 Alist to decide a coding system to use for a process I/O operation.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10648 The format is ((PATTERN . VAL) ...),
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10649 where PATTERN is a regular expression matching a program name,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10650 VAL is a coding system, a cons of coding systems, or a function symbol.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10651 If VAL is a coding system, it is used for both decoding what is received
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10652 from the program and encoding what is sent to the program.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10653 If VAL is a cons of coding systems, the car part is used for decoding,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10654 and the cdr part is used for encoding.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10655 If VAL is a function symbol, the function must return a coding system
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10656 or a cons of coding systems which are used as above.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10657
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10658 See also the function `find-operation-coding-system'. */);
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10659 Vprocess_coding_system_alist = Qnil;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10660
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10661 DEFVAR_LISP ("network-coding-system-alist", &Vnetwork_coding_system_alist,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10662 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10663 Alist to decide a coding system to use for a network I/O operation.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10664 The format is ((PATTERN . VAL) ...),
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10665 where PATTERN is a regular expression matching a network service name
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10666 or is a port number to connect to,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10667 VAL is a coding system, a cons of coding systems, or a function symbol.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10668 If VAL is a coding system, it is used for both decoding what is received
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10669 from the network stream and encoding what is sent to the network stream.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10670 If VAL is a cons of coding systems, the car part is used for decoding,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10671 and the cdr part is used for encoding.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10672 If VAL is a function symbol, the function must return a coding system
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10673 or a cons of coding systems which are used as above.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10674
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10675 See also the function `find-operation-coding-system'. */);
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10676 Vnetwork_coding_system_alist = Qnil;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10677
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10678 DEFVAR_LISP ("locale-coding-system", &Vlocale_coding_system,
41026
6f20449b7e12 (syms_of_coding): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents: 41006
diff changeset
10679 doc: /* Coding system to use with system messages.
6f20449b7e12 (syms_of_coding): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents: 41006
diff changeset
10680 Also used for decoding keyboard input on the X Window System. */);
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10681 Vlocale_coding_system = Qnil;
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10682
29182
1d1c27067af4 (encode_eol): Add null statement after label.
Dave Love <fx@gnu.org>
parents: 29172
diff changeset
10683 /* The eol mnemonics are reset in startup.el system-dependently. */
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10684 DEFVAR_LISP ("eol-mnemonic-unix", &eol_mnemonic_unix,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10685 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10686 *String displayed in mode line for UNIX-like (LF) end-of-line format. */);
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10687 eol_mnemonic_unix = make_pure_c_string (":");
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10688
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10689 DEFVAR_LISP ("eol-mnemonic-dos", &eol_mnemonic_dos,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10690 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10691 *String displayed in mode line for DOS-like (CRLF) end-of-line format. */);
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10692 eol_mnemonic_dos = make_pure_c_string ("\\");
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10693
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10694 DEFVAR_LISP ("eol-mnemonic-mac", &eol_mnemonic_mac,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10695 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10696 *String displayed in mode line for MAC-like (CR) end-of-line format. */);
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10697 eol_mnemonic_mac = make_pure_c_string ("/");
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10698
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10699 DEFVAR_LISP ("eol-mnemonic-undecided", &eol_mnemonic_undecided,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10700 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10701 *String displayed in mode line when end-of-line format is not yet determined. */);
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10702 eol_mnemonic_undecided = make_pure_c_string (":");
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10703
22119
592bb8b9bcfd Change terms unify/unification to
Kenichi Handa <handa@m17n.org>
parents: 22020
diff changeset
10704 DEFVAR_LISP ("enable-character-translation", &Venable_character_translation,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10705 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10706 *Non-nil enables character translation while encoding and decoding. */);
22119
592bb8b9bcfd Change terms unify/unification to
Kenichi Handa <handa@m17n.org>
parents: 22020
diff changeset
10707 Venable_character_translation = Qt;
592bb8b9bcfd Change terms unify/unification to
Kenichi Handa <handa@m17n.org>
parents: 22020
diff changeset
10708
22186
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
10709 DEFVAR_LISP ("standard-translation-table-for-decode",
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10710 &Vstandard_translation_table_for_decode,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10711 doc: /* Table for translating characters while decoding. */);
22186
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
10712 Vstandard_translation_table_for_decode = Qnil;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
10713
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
10714 DEFVAR_LISP ("standard-translation-table-for-encode",
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10715 &Vstandard_translation_table_for_encode,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10716 doc: /* Table for translating characters while encoding. */);
22186
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
10717 Vstandard_translation_table_for_encode = Qnil;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10718
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10719 DEFVAR_LISP ("charset-revision-table", &Vcharset_revision_table,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10720 doc: /* Alist of charsets vs revision numbers.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10721 While encoding, if a charset (car part of an element) is found,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10722 designate it with the escape sequence identifying revision (cdr part
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10723 of the element). */);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10724 Vcharset_revision_table = Qnil;
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10725
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10726 DEFVAR_LISP ("default-process-coding-system",
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10727 &Vdefault_process_coding_system,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10728 doc: /* Cons of coding systems used for process I/O by default.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10729 The car part is used for decoding a process output,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10730 the cdr part is used for encoding a text to be sent to a process. */);
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10731 Vdefault_process_coding_system = Qnil;
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
10732
19365
d9374f5ebd3a (CODING_FLAG_ISO_LATIN_EXTRA): New macro.
Kenichi Handa <handa@m17n.org>
parents: 19285
diff changeset
10733 DEFVAR_LISP ("latin-extra-code-table", &Vlatin_extra_code_table,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10734 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10735 Table of extra Latin codes in the range 128..159 (inclusive).
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10736 This is a vector of length 256.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10737 If Nth element is non-nil, the existence of code N in a file
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10738 \(or output of subprocess) doesn't prevent it to be detected as
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10739 a coding system of ISO 2022 variant which has a flag
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10740 `accept-latin-extra-code' t (e.g. iso-latin-1) on reading a file
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10741 or reading output of a subprocess.
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10742 Only 128th through 159th elements have a meaning. */);
19365
d9374f5ebd3a (CODING_FLAG_ISO_LATIN_EXTRA): New macro.
Kenichi Handa <handa@m17n.org>
parents: 19285
diff changeset
10743 Vlatin_extra_code_table = Fmake_vector (make_number (256), Qnil);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10744
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10745 DEFVAR_LISP ("select-safe-coding-system-function",
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10746 &Vselect_safe_coding_system_function,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10747 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10748 Function to call to select safe coding system for encoding a text.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10749
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10750 If set, this function is called to force a user to select a proper
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10751 coding system which can encode the text in the case that a default
87778
0ec6f8d26078 (select-safe-coding-system-function): Doc fix.
Glenn Morris <rgm@gnu.org>
parents: 87710
diff changeset
10752 coding system used in each operation can't encode the text. The
0ec6f8d26078 (select-safe-coding-system-function): Doc fix.
Glenn Morris <rgm@gnu.org>
parents: 87710
diff changeset
10753 function should take care that the buffer is not modified while
0ec6f8d26078 (select-safe-coding-system-function): Doc fix.
Glenn Morris <rgm@gnu.org>
parents: 87710
diff changeset
10754 the coding system is being selected.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10755
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10756 The default value is `select-safe-coding-system' (which see). */);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10757 Vselect_safe_coding_system_function = Qnil;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10758
48874
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10759 DEFVAR_BOOL ("coding-system-require-warning",
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10760 &coding_system_require_warning,
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10761 doc: /* Internal use only.
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10762 If non-nil, on writing a file, `select-safe-coding-system-function' is
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10763 called even if `coding-system-for-write' is non-nil. The command
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10764 `universal-coding-system-argument' binds this variable to t temporarily. */);
48874
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10765 coding_system_require_warning = 0;
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10766
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10767
30292
14a9937df1f5 (syms_of_coding): Fix typo in spelling of variable
Gerd Moellmann <gerd@gnu.org>
parents: 30263
diff changeset
10768 DEFVAR_BOOL ("inhibit-iso-escape-detection",
30204
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
10769 &inhibit_iso_escape_detection,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10770 doc: /*
101040
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10771 If non-nil, Emacs ignores ISO-2022 escape sequences during code detection.
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10772
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10773 When Emacs reads text, it tries to detect how the text is encoded.
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10774 This code detection is sensitive to escape sequences. If Emacs sees
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10775 a valid ISO-2022 escape sequence, it assumes the text is encoded in one
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10776 of the ISO2022 encodings, and decodes text by the corresponding coding
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10777 system (e.g. `iso-2022-7bit').
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10778
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10779 However, there may be a case that you want to read escape sequences in
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10780 a file as is. In such a case, you can set this variable to non-nil.
101040
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10781 Then the code detection will ignore any escape sequences, and no text is
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10782 detected as encoded in some ISO-2022 encoding. The result is that all
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10783 escape sequences become visible in a buffer.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10784
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10785 The default value is nil, and it is strongly recommended not to change
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10786 it. That is because many Emacs Lisp source files that contain
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10787 non-ASCII characters are encoded by the coding system `iso-2022-7bit'
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10788 in Emacs's distribution, and they won't be decoded correctly on
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10789 reading if you suppress escape sequence detection.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10790
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10791 The other way to read escape sequences in a file without decoding is
101040
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10792 to explicitly specify some coding system that doesn't use ISO-2022
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10793 escape sequence (e.g `latin-1') on reading by \\[universal-coding-system-argument]. */);
30204
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
10794 inhibit_iso_escape_detection = 0;
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
10795
101040
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10796 DEFVAR_BOOL ("inhibit-null-byte-detection",
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10797 &inhibit_null_byte_detection,
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10798 doc: /* If non-nil, Emacs ignores null bytes on code detection.
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10799 By default, Emacs treats it as binary data, and does not attempt to
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10800 decode it. The effect is as if you specified `no-conversion' for
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10801 reading that text.
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10802
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10803 Set this to non-nil when a regular text happens to include null bytes.
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10804 Examples are Index nodes of Info files and null-byte delimited output
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10805 from GNU Find and GNU Grep. Emacs will then ignore the null bytes and
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10806 decode text as usual. */);
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10807 inhibit_null_byte_detection = 0;
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10808
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
10809 DEFVAR_LISP ("translation-table-for-input", &Vtranslation_table_for_input,
48230
c2ce8280fb97 (Vtranslation_table_for_input): New.
Dave Love <fx@gnu.org>
parents: 48182
diff changeset
10810 doc: /* Char table for translating self-inserting characters.
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10811 This is applied to the result of input methods, not their input.
101854
7e576fc18303 (syms_of_coding) <translation-table-for-input>: Modify doc string to
Eli Zaretskii <eliz@gnu.org>
parents: 101776
diff changeset
10812 See also `keyboard-translate-table'.
7e576fc18303 (syms_of_coding) <translation-table-for-input>: Modify doc string to
Eli Zaretskii <eliz@gnu.org>
parents: 101776
diff changeset
10813
7e576fc18303 (syms_of_coding) <translation-table-for-input>: Modify doc string to
Eli Zaretskii <eliz@gnu.org>
parents: 101776
diff changeset
10814 Use of this variable for character code unification was rendered
7e576fc18303 (syms_of_coding) <translation-table-for-input>: Modify doc string to
Eli Zaretskii <eliz@gnu.org>
parents: 101776
diff changeset
10815 obsolete in Emacs 23.1 and later, since Unicode is now the basis of
7e576fc18303 (syms_of_coding) <translation-table-for-input>: Modify doc string to
Eli Zaretskii <eliz@gnu.org>
parents: 101776
diff changeset
10816 internal character representation. */);
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
10817 Vtranslation_table_for_input = Qnil;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10818
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10819 {
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10820 Lisp_Object args[coding_arg_max];
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10821 Lisp_Object plist[16];
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10822 int i;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10823
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10824 for (i = 0; i < coding_arg_max; i++)
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10825 args[i] = Qnil;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10826
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10827 plist[0] = intern_c_string (":name");
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10828 plist[1] = args[coding_arg_name] = Qno_conversion;
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10829 plist[2] = intern_c_string (":mnemonic");
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10830 plist[3] = args[coding_arg_mnemonic] = make_number ('=');
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10831 plist[4] = intern_c_string (":coding-type");
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10832 plist[5] = args[coding_arg_coding_type] = Qraw_text;
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10833 plist[6] = intern_c_string (":ascii-compatible-p");
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10834 plist[7] = args[coding_arg_ascii_compatible_p] = Qt;
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10835 plist[8] = intern_c_string (":default-char");
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10836 plist[9] = args[coding_arg_default_char] = make_number (0);
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10837 plist[10] = intern_c_string (":for-unibyte");
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10838 plist[11] = args[coding_arg_for_unibyte] = Qt;
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10839 plist[12] = intern_c_string (":docstring");
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10840 plist[13] = make_pure_c_string ("Do no conversion.\n\
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10841 \n\
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10842 When you visit a file with this coding, the file is read into a\n\
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10843 unibyte buffer as is, thus each byte of a file is treated as a\n\
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10844 character.");
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10845 plist[14] = intern_c_string (":eol-type");
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10846 plist[15] = args[coding_arg_eol_type] = Qunix;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10847 args[coding_arg_plist] = Flist (16, plist);
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10848 Fdefine_coding_system_internal (coding_arg_max, args);
90011
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10849
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10850 plist[1] = args[coding_arg_name] = Qundecided;
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10851 plist[3] = args[coding_arg_mnemonic] = make_number ('-');
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10852 plist[5] = args[coding_arg_coding_type] = Qundecided;
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10853 /* This is already set.
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10854 plist[7] = args[coding_arg_ascii_compatible_p] = Qt; */
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10855 plist[8] = intern_c_string (":charset-list");
90011
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10856 plist[9] = args[coding_arg_charset_list] = Fcons (Qascii, Qnil);
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10857 plist[11] = args[coding_arg_for_unibyte] = Qnil;
105877
21bdda3ded62 * xterm.c (syms_of_xterm):
Dan Nicolaescu <dann@ics.uci.edu>
parents: 105669
diff changeset
10858 plist[13] = make_pure_c_string ("No conversion on encoding, automatic conversion on decoding.");
90011
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10859 plist[15] = args[coding_arg_eol_type] = Qnil;
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10860 args[coding_arg_plist] = Flist (16, plist);
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10861 Fdefine_coding_system_internal (coding_arg_max, args);
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10862 }
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10863
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10864 setup_coding_system (Qno_conversion, &safe_terminal_coding);
89467
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10865
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10866 {
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10867 int i;
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10868
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10869 for (i = 0; i < coding_category_max; i++)
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10870 Fset (AREF (Vcoding_category_table, i), Qno_conversion);
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10871 }
109158
6175ebc3b6ce * coding.c: Use SPECPDL_INDEX, DOS_NT.
Juanma Barranquero <lekktu@gmail.com>
parents: 109126
diff changeset
10872 #if defined (DOS_NT)
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10873 system_eol_type = Qdos;
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10874 #else
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10875 system_eol_type = Qunix;
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10876 #endif
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10877 staticpro (&system_eol_type);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10878 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10879
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
/* Return the message text for the system error code ERROR_NUMBER.
   The text is obtained from strerror.  When Vlocale_coding_system is
   non-nil, that text is first passed through
   code_convert_string_norecord with that coding system, and a pointer
   to the converted string's data is returned instead.
   NOTE(review): in the converted case the result points into the Lisp
   string `dec', which nothing in this function keeps referenced after
   return -- confirm that callers consume the text before it can be
   invalidated.  */
10880 char *
109126
aec1143e8d85 Convert (most) functions in src to standard C.
Dan Nicolaescu <dann@ics.uci.edu>
parents: 109100
diff changeset
10881 emacs_strerror (int error_number)
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10882 {
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10883 char *str;
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10884
26526
b7438760079b * callproc.c (strerror): Remove decl.
Paul Eggert <eggert@twinsun.com>
parents: 26240
diff changeset
/* NOTE(review): presumably selects the locale used for system
   messages before strerror is called; the helper is defined
   elsewhere -- confirm.  */
10885 synchronize_system_messages_locale ();
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10886 str = strerror (error_number);
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10887
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10888 if (! NILP (Vlocale_coding_system))
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10889 {
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
/* Convert the strerror text using Vlocale_coding_system.  The
   trailing 0 presumably requests decoding rather than encoding (the
   result is named `dec') -- TODO confirm against
   code_convert_string_norecord.  */
10890 Lisp_Object dec = code_convert_string_norecord (build_string (str),
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10891 Vlocale_coding_system,
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10892 0);
46370
40db0673e6f0 Most uses of XSTRING combined with STRING_BYTES or indirection changed to
Ken Raeburn <raeburn@raeburn.org>
parents: 46293
diff changeset
/* From here on STR refers to the converted string's data rather than
   to the pointer strerror returned.  */
10893 str = (char *) SDATA (dec);
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10894 }
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10895
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10896 return str;
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10897 }
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10898
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10899 #endif /* emacs */