annotate src/coding.c @ 100587:d91e3320dd81

(decode_coding): Clear chars_at_source flag when using charbuf.
author Jason Rumney <jasonr@gnu.org>
date Sat, 20 Dec 2008 07:59:33 +0000
parents 3e044fa54e4f
children 5c5e6d041634
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
88936
c6ed294ee664 Comment fix
Dave Love <fx@gnu.org>
parents: 88889
diff changeset
1 /* Coding system handler (conversion, detection, etc).
68651
3bd95f4f2941 Update years in copyright notice; nfc.
Thien-Thi Nguyen <ttn@gnuvola.org>
parents: 68567
diff changeset
2 Copyright (C) 2001, 2002, 2003, 2004, 2005,
79759
fc2bcd2a8aad Add 2008 to copyright years.
Glenn Morris <rgm@gnu.org>
parents: 79107
diff changeset
3 2006, 2007, 2008 Free Software Foundation, Inc.
74605
6ee41fdd69ff Update AIST copyright years.
Kenichi Handa <handa@m17n.org>
parents: 73995
diff changeset
4 Copyright (C) 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
79759
fc2bcd2a8aad Add 2008 to copyright years.
Glenn Morris <rgm@gnu.org>
parents: 79107
diff changeset
5 2005, 2006, 2007, 2008
67658
547f2b420666 Copyright fixed
Kenichi Handa <handa@m17n.org>
parents: 67555
diff changeset
6 National Institute of Advanced Industrial Science and Technology (AIST)
547f2b420666 Copyright fixed
Kenichi Handa <handa@m17n.org>
parents: 67555
diff changeset
7 Registration Number H14PRO021
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8 Copyright (C) 2003
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9 National Institute of Advanced Industrial Science and Technology (AIST)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10 Registration Number H13PRO009
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
11
17071
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
12 This file is part of GNU Emacs.
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
13
94963
8971ddf55736 Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents: 94944
diff changeset
14 GNU Emacs is free software: you can redistribute it and/or modify
17071
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
15 it under the terms of the GNU General Public License as published by
94963
8971ddf55736 Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents: 94944
diff changeset
16 the Free Software Foundation, either version 3 of the License, or
8971ddf55736 Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents: 94944
diff changeset
17 (at your option) any later version.
17071
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
18
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
19 GNU Emacs is distributed in the hope that it will be useful,
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
20 but WITHOUT ANY WARRANTY; without even the implied warranty of
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
21 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
22 GNU General Public License for more details.
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
23
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
24 You should have received a copy of the GNU General Public License
94963
8971ddf55736 Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents: 94944
diff changeset
25 along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
26
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
27 /*** TABLE OF CONTENTS ***
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
28
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
29 0. General comments
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
30 1. Preamble
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
31 2. Emacs' internal format (emacs-utf-8) handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
32 3. UTF-8 handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
33 4. UTF-16 handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
34 5. Charset-base coding systems handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
35 6. emacs-mule (old Emacs' internal format) handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
36 7. ISO2022 handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
37 8. Shift-JIS and BIG5 handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
38 9. CCL handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
39 10. C library functions
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
40 11. Emacs Lisp library functions
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
41 12. Postamble
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
42
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
43 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
44
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
45 /*** 0. General comments ***
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
46
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
47
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
48 CODING SYSTEM
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
49
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
50 A coding system is an object for an encoding mechanism that contains
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
51 information about how to convert byte sequences to character
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
52 sequences and vice versa. When we say "decode", it means converting
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
53 a byte sequence of a specific coding system into a character
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
54 sequence that is represented by Emacs' internal coding system
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
55 `emacs-utf-8', and when we say "encode", it means converting a
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
56 character sequence of emacs-utf-8 to a byte sequence of a specific
17835
f36ffb6f1208 Name change through the code:
Kenichi Handa <handa@m17n.org>
parents: 17725
diff changeset
57 coding system.
f36ffb6f1208 Name change through the code:
Kenichi Handa <handa@m17n.org>
parents: 17725
diff changeset
58
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
59 In Emacs Lisp, a coding system is represented by a Lisp symbol. In
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
60 C level, a coding system is represented by a vector of attributes
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
61 stored in the hash table Vcharset_hash_table. The conversion from
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
62 coding system symbol to attributes vector is done by looking up
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
63 Vcharset_hash_table by the symbol.
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
64
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
65 Coding systems are classified into the following types depending on
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
66 the encoding mechanism. Here's a brief description of the types.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
67
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
68 o UTF-8
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
69
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
70 o UTF-16
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
71
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
72 o Charset-base coding system
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
73
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
74 A coding system defined by one or more (coded) character sets.
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
75 Decoding and encoding are done by a code converter defined for each
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
76 character set.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
77
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
78 o Old Emacs internal format (emacs-mule)
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
79
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
80 The coding system adopted by old versions of Emacs (20 and 21).
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
81
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
82 o ISO2022-base coding system
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
83
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
84 The most famous coding system for multiple character sets. X's
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
85 Compound Text, various EUCs (Extended Unix Code), and coding systems
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
86 used in Internet communication such as ISO-2022-JP are all
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
87 variants of ISO2022.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
88
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
89 o SJIS (or Shift-JIS or MS-Kanji-Code)
42104
d69c2368e549 (DECODE_COMPOSITION_END): Fixed a typo in the last
Sam Steingold <sds@gnu.org>
parents: 42103
diff changeset
90
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
91 A coding system to encode character sets: ASCII, JISX0201, and
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
92 JISX0208. Widely used for PC's in Japan. Details are described in
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
93 section 8.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
94
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
95 o BIG5
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
96
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
97 A coding system to encode character sets: ASCII and Big5. Widely
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
98 used for Chinese (mainly in Taiwan and Hong Kong). Details are
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
99 described in section 8. In this file, when we write "big5" (all
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
100 lowercase), we mean the coding system, and when we write "Big5"
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
101 (capitalized), we mean the character set.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
102
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
103 o CCL
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
104
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
105 If a user wants to decode/encode text encoded in a coding system
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
106 not listed above, he can supply a decoder and an encoder for it in
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
107 CCL (Code Conversion Language) programs. Emacs executes the CCL
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
108 program while decoding/encoding.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
109
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
110 o Raw-text
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
111
88771
75c78754826d comments
Dave Love <fx@gnu.org>
parents: 88690
diff changeset
112 A coding system for text containing raw eight-bit data. Emacs
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
113 treats each byte of source text as a character (except for
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
114 end-of-line conversion).
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
115
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
116 o No-conversion
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
117
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
118 Like raw text, but don't do end-of-line conversion.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
119
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
120
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
121 END-OF-LINE FORMAT
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
122
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
123 How text end-of-line is encoded depends on the operating system. For
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
124 instance, Unix's format is just one byte of LF (line-feed) code,
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
125 whereas DOS's format is a two-byte sequence of `carriage-return' and
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
126 `line-feed' codes. MacOS's format is usually one byte of
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
127 `carriage-return'.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
128
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
129 Since text character encoding and end-of-line encoding are
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
130 independent, any coding system described above can take any format
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
131 of end-of-line (except for no-conversion).
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
132
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
133 STRUCT CODING_SYSTEM
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
134
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
135 Before using a coding system for code conversion (i.e. decoding and
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
136 encoding), we set up a structure of type `struct coding_system'.
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
137 This structure keeps various information about a specific code
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
138 conversion (e.g. the location of source and destination data).
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
139
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
140 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
141
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
142 /* COMMON MACROS */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
143
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
144
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
145 /*** GENERAL NOTES on `detect_coding_XXX ()' functions ***
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
146
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
147 These functions check if a byte sequence specified as a source in
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
148 CODING conforms to the format of XXX, and update the members of
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
149 DETECT_INFO.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
150
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
151 Return 1 if the byte sequence conforms to XXX, otherwise return 0.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
152
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
153 Below is the template of these functions. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
154
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
155 #if 0
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
156 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
157 detect_coding_XXX (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
158 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
159 struct coding_detection_info *detect_info;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
160 {
90070
95879cc1ed20 Revision: miles@gnu.org--gnu-2004/emacs--unicode--0--patch-81
Miles Bader <miles@gnu.org>
parents: 90061 59173
diff changeset
161 const unsigned char *src = coding->source;
95879cc1ed20 Revision: miles@gnu.org--gnu-2004/emacs--unicode--0--patch-81
Miles Bader <miles@gnu.org>
parents: 90061 59173
diff changeset
162 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
163 int multibytep = coding->src_multibyte;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
164 int consumed_chars = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
165 int found = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
166 ...;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
167
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
168 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
169 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
170 /* Get one byte from the source. If the source is exhausted, jump
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
171 to no_more_source:. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
172 ONE_MORE_BYTE (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
173
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
174 if (! __C_conforms_to_XXX___ (c))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
175 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
176 if (__C_strongly_suggests_XXX__ (c))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
177 found = CATEGORY_MASK_XXX;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
178 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
179 /* The byte sequence is invalid for XXX. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
180 detect_info->rejected |= CATEGORY_MASK_XXX;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
181 return 0;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
182
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
183 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
184 /* The source was exhausted successfully. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
185 detect_info->found |= found;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
186 return 1;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
187 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
188 #endif
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
189
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
190 /*** GENERAL NOTES on `decode_coding_XXX ()' functions ***
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
191
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
192 These functions decode a byte sequence specified as a source by
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
193 CODING. The resulting multibyte text goes to a place pointed to by
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
194 CODING->charbuf, the length of which should not exceed
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
195 CODING->charbuf_size.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
196
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
197 These functions set the information of original and decoded texts in
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
198 CODING->consumed, CODING->consumed_char, and CODING->charbuf_used.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
199 They also set CODING->result to one of CODING_RESULT_XXX indicating
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
200 how the decoding is finished.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
201
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
202 Below is the template of these functions. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
203
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
204 #if 0
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
205 static void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
206 decode_coding_XXXX (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
207 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
208 {
90070
95879cc1ed20 Revision: miles@gnu.org--gnu-2004/emacs--unicode--0--patch-81
Miles Bader <miles@gnu.org>
parents: 90061 59173
diff changeset
209 const unsigned char *src = coding->source + coding->consumed;
95879cc1ed20 Revision: miles@gnu.org--gnu-2004/emacs--unicode--0--patch-81
Miles Bader <miles@gnu.org>
parents: 90061 59173
diff changeset
210 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
211 /* SRC_BASE remembers the start position in source in each loop.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
212 The loop will be exited when there are not enough source bytes, or
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
213 when there's no room in CHARBUF for a decoded character. */
90070
95879cc1ed20 Revision: miles@gnu.org--gnu-2004/emacs--unicode--0--patch-81
Miles Bader <miles@gnu.org>
parents: 90061 59173
diff changeset
214 const unsigned char *src_base;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
215 /* A buffer to produce decoded characters. */
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
216 int *charbuf = coding->charbuf + coding->charbuf_used;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
217 int *charbuf_end = coding->charbuf + coding->charbuf_size;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
218 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
219
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
220 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
221 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
222 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
223 if (charbuf >= charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
224 /* No more room to produce a decoded character. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
225 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
226 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
227 /* Decode it. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
228 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
229
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
230 no_more_source:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
231 if (src_base < src_end
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
232 && coding->mode & CODING_MODE_LAST_BLOCK)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
233 /* If the source ends by partial bytes to construct a character,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
234 treat them as eight-bit raw data. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
235 while (src_base < src_end && charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
236 *charbuf++ = *src_base++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
237 /* Remember how many bytes and characters we consumed. If the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
238 source is multibyte, the bytes and chars are not identical. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
239 coding->consumed = coding->consumed_char = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
240 /* Remember how many characters we produced. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
241 coding->charbuf_used = charbuf - coding->charbuf;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
242 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
243 #endif
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
244
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
245 /*** GENERAL NOTES on `encode_coding_XXX ()' functions ***
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
246
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
247 These functions encode SRC_BYTES length text at SOURCE of Emacs'
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
248 internal multibyte format by CODING. The resulting byte sequence
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
249 goes to a place pointed to by DESTINATION, the length of which
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
250 should not exceed DST_BYTES.
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
251
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
252 These functions set the information of original and encoded texts in
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
253 the members produced, produced_char, consumed, and consumed_char of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
254 the structure *CODING. They also set the member result to one of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
255 CODING_RESULT_XXX indicating how the encoding finished.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
256
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
257 DST_BYTES zero means that source area and destination area are
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
258 overlapped, which means that we can produce an encoded text until it
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
259 reaches the head of not-yet-encoded source text.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
260
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
261 Below is a template of these functions. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
262 #if 0
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
263 static void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
264 encode_coding_XXX (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
265 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
266 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
267 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
268 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
269 int *charbuf_end = coding->charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
270 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
271 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
272 unsigned char *adjusted_dst_end = dst_end - _MAX_BYTES_PRODUCED_IN_LOOP_;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
273 int produced_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
274
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
275 for (; charbuf < charbuf_end && dst < adjusted_dst_end; charbuf++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
276 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
277 int c = *charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
278 /* Encode C into DST, and increment DST. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
279 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
280 label_no_more_destination:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
281 /* How many chars and bytes we produced. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
282 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
283 coding->produced = dst - coding->destination;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
284 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
285 #endif
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
286
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
287
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
288 /*** 1. Preamble ***/
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
289
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
290 #include <config.h>
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
291 #include <stdio.h>
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
292
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
293 #include "lisp.h"
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
294 #include "buffer.h"
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
295 #include "character.h"
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
296 #include "charset.h"
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
297 #include "ccl.h"
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
298 #include "composite.h"
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
299 #include "coding.h"
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
300 #include "window.h"
83127
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
301 #include "frame.h"
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
302 #include "termhooks.h"
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
303
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
304 Lisp_Object Vcoding_system_hash_table;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
305
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
306 Lisp_Object Qcoding_system, Qcoding_aliases, Qeol_type;
88646
d3b1f30e2267 (Qmac): Remove (duplicated) definition.
Dave Love <fx@gnu.org>
parents: 88645
diff changeset
307 Lisp_Object Qunix, Qdos;
d3b1f30e2267 (Qmac): Remove (duplicated) definition.
Dave Love <fx@gnu.org>
parents: 88645
diff changeset
308 extern Lisp_Object Qmac; /* frame.c */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
309 Lisp_Object Qbuffer_file_coding_system;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
310 Lisp_Object Qpost_read_conversion, Qpre_write_conversion;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
311 Lisp_Object Qdefault_char;
19612
783efd6c7c1e (Qno_conversion, Qundecided): New variables.
Kenichi Handa <handa@m17n.org>
parents: 19546
diff changeset
312 Lisp_Object Qno_conversion, Qundecided;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
313 Lisp_Object Qcharset, Qiso_2022, Qutf_8, Qutf_16, Qshift_jis, Qbig5;
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
314 Lisp_Object Qbig, Qlittle;
19750
95e4e1cba6ac (Qcoding_system_history): New variable.
Richard M. Stallman <rms@gnu.org>
parents: 19747
diff changeset
315 Lisp_Object Qcoding_system_history;
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
316 Lisp_Object Qvalid_codes;
100303
3e044fa54e4f * coding.c (QCdefault_char): Rename from QCdefalut_char.
Juanma Barranquero <lekktu@gmail.com>
parents: 100262
diff changeset
317 Lisp_Object QCcategory, QCmnemonic, QCdefault_char;
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
318 Lisp_Object QCdecode_translation_table, QCencode_translation_table;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
319 Lisp_Object QCpost_read_conversion, QCpre_write_conversion;
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
320 Lisp_Object QCascii_compatible_p;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
321
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
322 extern Lisp_Object Qinsert_file_contents, Qwrite_region;
64251
3de1b955c31a * coding.c (Qprocess_argument):
Kim F. Storm <storm@cua.dk>
parents: 64084
diff changeset
323 Lisp_Object Qcall_process, Qcall_process_region;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
324 Lisp_Object Qstart_process, Qopen_network_stream;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
325 Lisp_Object Qtarget_idx;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
326
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
327 Lisp_Object Qinsufficient_source, Qinconsistent_eol, Qinvalid_source;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
328 Lisp_Object Qinterrupted, Qinsufficient_memory;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
329
79107
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
330 extern Lisp_Object Qcompletion_ignore_case;
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
331
52794
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
332 /* If a symbol has this property, evaluate the value to define the
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
333 symbol as a coding system. */
90272
f1df126ec7de Sync to HEAD for handling autoload-coding-system.
Kenichi Handa <handa@m17n.org>
parents: 90263
diff changeset
334 static Lisp_Object Qcoding_system_define_form;
f1df126ec7de Sync to HEAD for handling autoload-coding-system.
Kenichi Handa <handa@m17n.org>
parents: 90263
diff changeset
335
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
336 int coding_system_require_warning;
52794
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
337
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
338 Lisp_Object Vselect_safe_coding_system_function;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
339
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
340 /* Mnemonic string for each format of end-of-line. */
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
341 Lisp_Object eol_mnemonic_unix, eol_mnemonic_dos, eol_mnemonic_mac;
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
342 /* Mnemonic string to indicate format of end-of-line is not yet
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
343 decided. */
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
344 Lisp_Object eol_mnemonic_undecided;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
345
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
346 /* Format of end-of-line decided by system. This is Qunix on
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
347 Unix and Mac, Qdos on DOS/Windows.
70520
b6740a317343 (setup_coding_system): For invalid coding-system, set
Kenichi Handa <handa@m17n.org>
parents: 69995
diff changeset
348 This has an effect only for external encoding (i.e. for output to
b6740a317343 (setup_coding_system): For invalid coding-system, set
Kenichi Handa <handa@m17n.org>
parents: 69995
diff changeset
349 file and process), not for in-buffer or Lisp string encoding. */
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
350 static Lisp_Object system_eol_type;
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
351
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
352 #ifdef emacs
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
353
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
354 Lisp_Object Vcoding_system_list, Vcoding_system_alist;
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
355
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
356 Lisp_Object Qcoding_system_p, Qcoding_system_error;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
357
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
358 /* Coding system emacs-mule and raw-text are for converting only
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
359 end-of-line format. */
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
360 Lisp_Object Qemacs_mule, Qraw_text;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
361 Lisp_Object Qutf_8_emacs;
51406
3c675181c3d8 (Qutf_8): New.
Dave Love <fx@gnu.org>
parents: 51356
diff changeset
362
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
363 /* Coding-systems are handed between Emacs Lisp programs and C internal
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
364 routines by the following three variables. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
365 /* Coding-system for reading files and receiving data from process. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
366 Lisp_Object Vcoding_system_for_read;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
367 /* Coding-system for writing files and sending data to process. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
368 Lisp_Object Vcoding_system_for_write;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
369 /* Coding-system actually used in the latest I/O. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
370 Lisp_Object Vlast_coding_system_used;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
371 /* Set to non-nil when an error is detected during code conversion. */
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
372 Lisp_Object Vlast_code_conversion_error;
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
373 /* A vector of length 256 which contains information about special
22529
d9eac134a41b Doc fixes.
Karl Heuer <kwzh@gnu.org>
parents: 22502
diff changeset
374 Latin codes (especially for dealing with Microsoft codes). */
19365
d9374f5ebd3a (CODING_FLAG_ISO_LATIN_EXTRA): New macro.
Kenichi Handa <handa@m17n.org>
parents: 19285
diff changeset
375 Lisp_Object Vlatin_extra_code_table;
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
376
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
377 /* Flag to inhibit code conversion of end-of-line format. */
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
378 int inhibit_eol_conversion;
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
379
30204
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
380 /* Flag to inhibit ISO2022 escape sequence detection. */
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
381 int inhibit_iso_escape_detection;
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
382
21574
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
383 /* Flag to make buffer-file-coding-system inherit from process-coding. */
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
384 int inherit_process_coding_system;
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
385
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
386 /* Coding system to be used to encode text for terminal display when
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
387 terminal coding system is nil. */
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
388 struct coding_system safe_terminal_coding;
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
389
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
390 Lisp_Object Vfile_coding_system_alist;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
391 Lisp_Object Vprocess_coding_system_alist;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
392 Lisp_Object Vnetwork_coding_system_alist;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
393
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
394 Lisp_Object Vlocale_coding_system;
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
395
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
396 #endif /* emacs */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
397
22186
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
398 /* Flag to tell if we look up translation table on character code
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
399 conversion. */
22119
592bb8b9bcfd Change terms unify/unification to
Kenichi Handa <handa@m17n.org>
parents: 22020
diff changeset
400 Lisp_Object Venable_character_translation;
22186
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
401 /* Standard translation table to look up on decoding (reading). */
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
402 Lisp_Object Vstandard_translation_table_for_decode;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
403 /* Standard translation table to look up on encoding (writing). */
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
404 Lisp_Object Vstandard_translation_table_for_encode;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
405
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
406 Lisp_Object Qtranslation_table;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
407 Lisp_Object Qtranslation_table_id;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
408 Lisp_Object Qtranslation_table_for_decode;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
409 Lisp_Object Qtranslation_table_for_encode;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
410
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
411 /* Alist of charsets vs revision number. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
412 static Lisp_Object Vcharset_revision_table;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
413
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
414 /* Default coding systems used for process I/O. */
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
415 Lisp_Object Vdefault_process_coding_system;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
416
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
417 /* Char table for translating Quail and self-inserting input. */
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
418 Lisp_Object Vtranslation_table_for_input;
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
419
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
420 /* Two special coding systems. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
421 Lisp_Object Vsjis_coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
422 Lisp_Object Vbig5_coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
423
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
424 /* ISO2022 section */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
425
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
426 #define CODING_ISO_INITIAL(coding, reg) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
427 (XINT (AREF (AREF (CODING_ID_ATTRS ((coding)->id), \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
428 coding_attr_iso_initial), \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
429 reg)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
430
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
431
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
432 #define CODING_ISO_REQUEST(coding, charset_id) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
433 ((charset_id <= (coding)->max_charset_id \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
434 ? (coding)->safe_charsets[charset_id] \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
435 : -1))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
436
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
437
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
438 #define CODING_ISO_FLAGS(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
439 ((coding)->spec.iso_2022.flags)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
440 #define CODING_ISO_DESIGNATION(coding, reg) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
441 ((coding)->spec.iso_2022.current_designation[reg])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
442 #define CODING_ISO_INVOCATION(coding, plane) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
443 ((coding)->spec.iso_2022.current_invocation[plane])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
444 #define CODING_ISO_SINGLE_SHIFTING(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
445 ((coding)->spec.iso_2022.single_shifting)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
446 #define CODING_ISO_BOL(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
447 ((coding)->spec.iso_2022.bol)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
448 #define CODING_ISO_INVOKED_CHARSET(coding, plane) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
449 CODING_ISO_DESIGNATION ((coding), CODING_ISO_INVOCATION ((coding), (plane)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
450
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
451 /* Control characters of ISO2022. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
452 /* code */ /* function */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
453 #define ISO_CODE_LF 0x0A /* line-feed */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
454 #define ISO_CODE_CR 0x0D /* carriage-return */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
455 #define ISO_CODE_SO 0x0E /* shift-out */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
456 #define ISO_CODE_SI 0x0F /* shift-in */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
457 #define ISO_CODE_SS2_7 0x19 /* single-shift-2 for 7-bit code */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
458 #define ISO_CODE_ESC 0x1B /* escape */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
459 #define ISO_CODE_SS2 0x8E /* single-shift-2 */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
460 #define ISO_CODE_SS3 0x8F /* single-shift-3 */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
461 #define ISO_CODE_CSI 0x9B /* control-sequence-introducer */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
462
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
463 /* All code (1-byte) of ISO2022 is classified into one of the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
464 following. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
465 enum iso_code_class_type
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
466 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
467 ISO_control_0, /* Control codes in the range
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
468 0x00..0x1F and 0x7F, except for the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
469 following 4 codes. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
470 ISO_shift_out, /* ISO_CODE_SO (0x0E) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
471 ISO_shift_in, /* ISO_CODE_SI (0x0F) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
472 ISO_single_shift_2_7, /* ISO_CODE_SS2_7 (0x19) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
473 ISO_escape, /* ISO_CODE_ESC (0x1B) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
474 ISO_control_1, /* Control codes in the range
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
475 0x80..0x9F, except for the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
476 following 3 codes. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
477 ISO_single_shift_2, /* ISO_CODE_SS2 (0x8E) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
478 ISO_single_shift_3, /* ISO_CODE_SS3 (0x8F) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
479 ISO_control_sequence_introducer, /* ISO_CODE_CSI (0x9B) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
480 ISO_0x20_or_0x7F, /* Codes of the values 0x20 or 0x7F. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
481 ISO_graphic_plane_0, /* Graphic codes in the range 0x21..0x7E. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
482 ISO_0xA0_or_0xFF, /* Codes of the values 0xA0 or 0xFF. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
483 ISO_graphic_plane_1 /* Graphic codes in the range 0xA1..0xFE. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
484 };
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
485
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
486 /** Each CODING_ISO_FLAG_XXX macro defines a flag bit of the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
487 `iso-flags' attribute of an iso2022 coding system. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
488
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
489 /* If set, produce long-form designation sequence (e.g. ESC $ ( A)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
490 instead of the correct short-form sequence (e.g. ESC $ A). */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
491 #define CODING_ISO_FLAG_LONG_FORM 0x0001
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
492
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
493 /* If set, reset graphic planes and registers at end-of-line to the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
494 initial state. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
495 #define CODING_ISO_FLAG_RESET_AT_EOL 0x0002
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
496
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
497 /* If set, reset graphic planes and registers before any control
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
498 characters to the initial state. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
499 #define CODING_ISO_FLAG_RESET_AT_CNTL 0x0004
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
500
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
501 /* If set, encode by 7-bit environment. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
502 #define CODING_ISO_FLAG_SEVEN_BITS 0x0008
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
503
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
504 /* If set, use locking-shift function. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
505 #define CODING_ISO_FLAG_LOCKING_SHIFT 0x0010
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
506
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
507 /* If set, use single-shift function. Overrides
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
508 CODING_ISO_FLAG_LOCKING_SHIFT. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
509 #define CODING_ISO_FLAG_SINGLE_SHIFT 0x0020
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
510
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
511 /* If set, use designation escape sequence. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
512 #define CODING_ISO_FLAG_DESIGNATION 0x0040
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
513
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
514 /* If set, produce revision number sequence. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
515 #define CODING_ISO_FLAG_REVISION 0x0080
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
516
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
517 /* If set, produce ISO6429's direction specifying sequence. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
518 #define CODING_ISO_FLAG_DIRECTION 0x0100
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
519
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
520 /* If set, assume designation states are reset at beginning of line on
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
521 output. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
522 #define CODING_ISO_FLAG_INIT_AT_BOL 0x0200
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
523
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
524 /* If set, designation sequence should be placed at beginning of line
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
525 on output. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
526 #define CODING_ISO_FLAG_DESIGNATE_AT_BOL 0x0400
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
527
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
528 /* If set, do not encode unsafe characters on output. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
529 #define CODING_ISO_FLAG_SAFE 0x0800
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
530
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
531 /* If set, extra latin codes (128..159) are accepted as a valid code
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
532 on input. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
533 #define CODING_ISO_FLAG_LATIN_EXTRA 0x1000
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
534
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
535 #define CODING_ISO_FLAG_COMPOSITION 0x2000
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
536
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
537 #define CODING_ISO_FLAG_EUC_TW_SHIFT 0x4000
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
538
88681
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
539 #define CODING_ISO_FLAG_USE_ROMAN 0x8000
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
540
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
541 #define CODING_ISO_FLAG_USE_OLDJIS 0x10000
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
542
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
543 #define CODING_ISO_FLAG_FULL_SUPPORT 0x100000
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
544
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
545 /* A character to be produced on output if encoding of the original
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
546 character is prohibited by CODING_ISO_FLAG_SAFE. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
547 #define CODING_INHIBIT_CHARACTER_SUBSTITUTION '?'
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
548
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
549 /* UTF-8 section */
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
550 #define CODING_UTF_8_BOM(coding) \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
551 ((coding)->spec.utf_8_bom)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
552
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
553 /* UTF-16 section */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
554 #define CODING_UTF_16_BOM(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
555 ((coding)->spec.utf_16.bom)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
556
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
557 #define CODING_UTF_16_ENDIAN(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
558 ((coding)->spec.utf_16.endian)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
559
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
560 #define CODING_UTF_16_SURROGATE(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
561 ((coding)->spec.utf_16.surrogate)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
562
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
563
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
564 /* CCL section */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
565 #define CODING_CCL_DECODER(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
566 AREF (CODING_ID_ATTRS ((coding)->id), coding_attr_ccl_decoder)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
567 #define CODING_CCL_ENCODER(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
568 AREF (CODING_ID_ATTRS ((coding)->id), coding_attr_ccl_encoder)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
569 #define CODING_CCL_VALIDS(coding) \
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
570 (SDATA (AREF (CODING_ID_ATTRS ((coding)->id), coding_attr_ccl_valids)))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
571
88771
75c78754826d comments
Dave Love <fx@gnu.org>
parents: 88690
diff changeset
572 /* Index for each coding category in `coding_categories' */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
573
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
574 enum coding_category
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
575 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
576 coding_category_iso_7,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
577 coding_category_iso_7_tight,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
578 coding_category_iso_8_1,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
579 coding_category_iso_8_2,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
580 coding_category_iso_7_else,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
581 coding_category_iso_8_else,
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
582 coding_category_utf_8_auto,
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
583 coding_category_utf_8_nosig,
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
584 coding_category_utf_8_sig,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
585 coding_category_utf_16_auto,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
586 coding_category_utf_16_be,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
587 coding_category_utf_16_le,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
588 coding_category_utf_16_be_nosig,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
589 coding_category_utf_16_le_nosig,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
590 coding_category_charset,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
591 coding_category_sjis,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
592 coding_category_big5,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
593 coding_category_ccl,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
594 coding_category_emacs_mule,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
595 /* All above are targets of code detection. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
596 coding_category_raw_text,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
597 coding_category_undecided,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
598 coding_category_max
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
599 };
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
600
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
601 /* Definitions of flag bits used in detect_coding_XXXX. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
602 #define CATEGORY_MASK_ISO_7 (1 << coding_category_iso_7)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
603 #define CATEGORY_MASK_ISO_7_TIGHT (1 << coding_category_iso_7_tight)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
604 #define CATEGORY_MASK_ISO_8_1 (1 << coding_category_iso_8_1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
605 #define CATEGORY_MASK_ISO_8_2 (1 << coding_category_iso_8_2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
606 #define CATEGORY_MASK_ISO_7_ELSE (1 << coding_category_iso_7_else)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
607 #define CATEGORY_MASK_ISO_8_ELSE (1 << coding_category_iso_8_else)
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
608 #define CATEGORY_MASK_UTF_8_AUTO (1 << coding_category_utf_8_auto)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
609 #define CATEGORY_MASK_UTF_8_NOSIG (1 << coding_category_utf_8_nosig)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
610 #define CATEGORY_MASK_UTF_8_SIG (1 << coding_category_utf_8_sig)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
611 #define CATEGORY_MASK_UTF_16_AUTO (1 << coding_category_utf_16_auto)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
612 #define CATEGORY_MASK_UTF_16_BE (1 << coding_category_utf_16_be)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
613 #define CATEGORY_MASK_UTF_16_LE (1 << coding_category_utf_16_le)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
614 #define CATEGORY_MASK_UTF_16_BE_NOSIG (1 << coding_category_utf_16_be_nosig)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
615 #define CATEGORY_MASK_UTF_16_LE_NOSIG (1 << coding_category_utf_16_le_nosig)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
616 #define CATEGORY_MASK_CHARSET (1 << coding_category_charset)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
617 #define CATEGORY_MASK_SJIS (1 << coding_category_sjis)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
618 #define CATEGORY_MASK_BIG5 (1 << coding_category_big5)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
619 #define CATEGORY_MASK_CCL (1 << coding_category_ccl)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
620 #define CATEGORY_MASK_EMACS_MULE (1 << coding_category_emacs_mule)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
621 #define CATEGORY_MASK_RAW_TEXT (1 << coding_category_raw_text)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
622
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
623 /* This value is returned if detect_coding_mask () finds nothing other
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
624 than ASCII characters. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
625 #define CATEGORY_MASK_ANY \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
626 (CATEGORY_MASK_ISO_7 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
627 | CATEGORY_MASK_ISO_7_TIGHT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
628 | CATEGORY_MASK_ISO_8_1 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
629 | CATEGORY_MASK_ISO_8_2 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
630 | CATEGORY_MASK_ISO_7_ELSE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
631 | CATEGORY_MASK_ISO_8_ELSE \
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
632 | CATEGORY_MASK_UTF_8_AUTO \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
633 | CATEGORY_MASK_UTF_8_NOSIG \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
634 | CATEGORY_MASK_UTF_8_SIG \
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
635 | CATEGORY_MASK_UTF_16_AUTO \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
636 | CATEGORY_MASK_UTF_16_BE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
637 | CATEGORY_MASK_UTF_16_LE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
638 | CATEGORY_MASK_UTF_16_BE_NOSIG \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
639 | CATEGORY_MASK_UTF_16_LE_NOSIG \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
640 | CATEGORY_MASK_CHARSET \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
641 | CATEGORY_MASK_SJIS \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
642 | CATEGORY_MASK_BIG5 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
643 | CATEGORY_MASK_CCL \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
644 | CATEGORY_MASK_EMACS_MULE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
645
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
646
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
647 #define CATEGORY_MASK_ISO_7BIT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
648 (CATEGORY_MASK_ISO_7 | CATEGORY_MASK_ISO_7_TIGHT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
649
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
650 #define CATEGORY_MASK_ISO_8BIT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
651 (CATEGORY_MASK_ISO_8_1 | CATEGORY_MASK_ISO_8_2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
652
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
653 #define CATEGORY_MASK_ISO_ELSE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
654 (CATEGORY_MASK_ISO_7_ELSE | CATEGORY_MASK_ISO_8_ELSE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
655
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
656 #define CATEGORY_MASK_ISO_ESCAPE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
657 (CATEGORY_MASK_ISO_7 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
658 | CATEGORY_MASK_ISO_7_TIGHT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
659 | CATEGORY_MASK_ISO_7_ELSE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
660 | CATEGORY_MASK_ISO_8_ELSE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
661
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
662 #define CATEGORY_MASK_ISO \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
663 ( CATEGORY_MASK_ISO_7BIT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
664 | CATEGORY_MASK_ISO_8BIT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
665 | CATEGORY_MASK_ISO_ELSE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
666
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
667 #define CATEGORY_MASK_UTF_16 \
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
668 (CATEGORY_MASK_UTF_16_AUTO \
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
669 | CATEGORY_MASK_UTF_16_BE \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
670 | CATEGORY_MASK_UTF_16_LE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
671 | CATEGORY_MASK_UTF_16_BE_NOSIG \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
672 | CATEGORY_MASK_UTF_16_LE_NOSIG)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
673
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
674 #define CATEGORY_MASK_UTF_8 \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
675 (CATEGORY_MASK_UTF_8_AUTO \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
676 | CATEGORY_MASK_UTF_8_NOSIG \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
677 | CATEGORY_MASK_UTF_8_SIG)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
678
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
679 /* List of symbols `coding-category-xxx' ordered by priority. This
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
680 variable is exposed to Emacs Lisp. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
681 static Lisp_Object Vcoding_category_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
682
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
683 /* Table of coding categories (Lisp symbols). This variable is for
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
684 internal use only. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
685 static Lisp_Object Vcoding_category_table;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
686
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
687 /* Table of coding-categories ordered by priority. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
688 static enum coding_category coding_priorities[coding_category_max];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
689
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
690 /* Nth element is a coding context for the coding system bound to the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
691 Nth coding category. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
692 static struct coding_system coding_categories[coding_category_max];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
693
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
694 /*** Commonly used macros and functions ***/
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
695
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
696 #ifndef min
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
697 #define min(a, b) ((a) < (b) ? (a) : (b))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
698 #endif
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
699 #ifndef max
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
700 #define max(a, b) ((a) > (b) ? (a) : (b))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
701 #endif
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
702
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
703 #define CODING_GET_INFO(coding, attrs, charset_list) \
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
704 do { \
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
705 (attrs) = CODING_ID_ATTRS ((coding)->id); \
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
706 (charset_list) = CODING_ATTR_CHARSET_LIST (attrs); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
707 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
708
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
709
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
710 /* Safely get one byte from the source text pointed by SRC which ends
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
711 at SRC_END, and set C to that byte. If there are not enough bytes
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
712 in the source, it jumps to `no_more_source'. If multibytep is
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
713 nonzero, and a multibyte character is found at SRC, set C to the
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
714 negative value of the character code. The caller should declare
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
715 and set these variables appropriately in advance:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
716 src, src_end, src_base, multibytep, consumed_chars, coding */
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
717
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
718 #define ONE_MORE_BYTE(c) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
719 do { \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
720 if (src == src_end) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
721 { \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
722 if (src_base < src) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
723 record_conversion_result \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
724 (coding, CODING_RESULT_INSUFFICIENT_SRC); \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
725 goto no_more_source; \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
726 } \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
727 c = *src++; \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
728 if (multibytep && (c & 0x80)) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
729 { \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
730 if ((c & 0xFE) == 0xC0) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
731 c = ((c & 1) << 6) | *src++; \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
732 else \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
733 { \
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
734 src--; \
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
735 c = - string_char (src, &src, NULL); \
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
736 record_conversion_result \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
737 (coding, CODING_RESULT_INVALID_SRC); \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
738 } \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
739 } \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
740 consumed_chars++; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
741 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
742
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
743
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
744 #define ONE_MORE_BYTE_NO_CHECK(c) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
745 do { \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
746 c = *src++; \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
747 if (multibytep && (c & 0x80)) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
748 { \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
749 if ((c & 0xFE) == 0xC0) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
750 c = ((c & 1) << 6) | *src++; \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
751 else \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
752 { \
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
753 src--; \
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
754 c = - string_char (src, &src, NULL); \
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
755 record_conversion_result \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
756 (coding, CODING_RESULT_INVALID_SRC); \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
757 } \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
758 } \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
759 consumed_chars++; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
760 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
761
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
762
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
763 /* Store a byte C in the place pointed by DST and increment DST to the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
764 next free point, and increment PRODUCED_CHARS. The caller should
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
765 assure that C is 0..127, and declare and set the variable `dst'
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
766 appropriately in advance.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
767 */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
768
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
769
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
770 #define EMIT_ONE_ASCII_BYTE(c) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
771 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
772 produced_chars++; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
773 *dst++ = (c); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
774 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
775
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
776
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
777 /* Like EMIT_ONE_ASCII_BYTE, but store two bytes; C1 and C2. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
778
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
779 #define EMIT_TWO_ASCII_BYTES(c1, c2) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
780 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
781 produced_chars += 2; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
782 *dst++ = (c1), *dst++ = (c2); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
783 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
784
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
785
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
786 /* Store a byte C in the place pointed by DST and increment DST to the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
787 next free point, and increment PRODUCED_CHARS. If MULTIBYTEP is
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
788 nonzero, store in an appropriate multibyte form. The caller should
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
789 declare and set the variables `dst' and `multibytep' appropriately
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
790 in advance. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
791
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
792 #define EMIT_ONE_BYTE(c) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
793 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
794 produced_chars++; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
795 if (multibytep) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
796 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
797 int ch = (c); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
798 if (ch >= 0x80) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
799 ch = BYTE8_TO_CHAR (ch); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
800 CHAR_STRING_ADVANCE (ch, dst); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
801 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
802 else \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
803 *dst++ = (c); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
804 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
805
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
806
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
807 /* Like EMIT_ONE_BYTE, but emit two bytes; C1 and C2. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
808
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
809 #define EMIT_TWO_BYTES(c1, c2) \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
810 do { \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
811 produced_chars += 2; \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
812 if (multibytep) \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
813 { \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
814 int ch; \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
815 \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
816 ch = (c1); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
817 if (ch >= 0x80) \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
818 ch = BYTE8_TO_CHAR (ch); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
819 CHAR_STRING_ADVANCE (ch, dst); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
820 ch = (c2); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
821 if (ch >= 0x80) \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
822 ch = BYTE8_TO_CHAR (ch); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
823 CHAR_STRING_ADVANCE (ch, dst); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
824 } \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
825 else \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
826 { \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
827 *dst++ = (c1); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
828 *dst++ = (c2); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
829 } \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
830 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
831
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
832
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
833 #define EMIT_THREE_BYTES(c1, c2, c3) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
834 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
835 EMIT_ONE_BYTE (c1); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
836 EMIT_TWO_BYTES (c2, c3); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
837 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
838
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
839
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
840 #define EMIT_FOUR_BYTES(c1, c2, c3, c4) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
841 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
842 EMIT_TWO_BYTES (c1, c2); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
843 EMIT_TWO_BYTES (c3, c4); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
844 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
845
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
846
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
847 /* Prototypes for static functions. */
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
848 static void record_conversion_result P_ ((struct coding_system *coding,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
849 enum coding_result_code result));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
850 static int detect_coding_utf_8 P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
851 struct coding_detection_info *info));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
852 static void decode_coding_utf_8 P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
853 static int encode_coding_utf_8 P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
854
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
855 static int detect_coding_utf_16 P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
856 struct coding_detection_info *info));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
857 static void decode_coding_utf_16 P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
858 static int encode_coding_utf_16 P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
859
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
860 static int detect_coding_iso_2022 P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
861 struct coding_detection_info *info));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
862 static void decode_coding_iso_2022 P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
863 static int encode_coding_iso_2022 P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
864
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
865 static int detect_coding_emacs_mule P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
866 struct coding_detection_info *info));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
867 static void decode_coding_emacs_mule P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
868 static int encode_coding_emacs_mule P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
869
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
870 static int detect_coding_sjis P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
871 struct coding_detection_info *info));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
872 static void decode_coding_sjis P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
873 static int encode_coding_sjis P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
874
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
875 static int detect_coding_big5 P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
876 struct coding_detection_info *info));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
877 static void decode_coding_big5 P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
878 static int encode_coding_big5 P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
879
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
880 static int detect_coding_ccl P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
881 struct coding_detection_info *info));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
882 static void decode_coding_ccl P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
883 static int encode_coding_ccl P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
884
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
885 static void decode_coding_raw_text P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
886 static int encode_coding_raw_text P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
887
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
888 static void coding_set_source P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
889 static void coding_set_destination P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
890 static void coding_alloc_by_realloc P_ ((struct coding_system *, EMACS_INT));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
891 static void coding_alloc_by_making_gap P_ ((struct coding_system *,
90772
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
892 EMACS_INT, EMACS_INT));
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
893 static unsigned char *alloc_destination P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
894 EMACS_INT, unsigned char *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
895 static void setup_iso_safe_charsets P_ ((Lisp_Object));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
896 static unsigned char *encode_designation_at_bol P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
897 int *, int *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
898 unsigned char *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
899 static int detect_eol P_ ((const unsigned char *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
900 EMACS_INT, enum coding_category));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
901 static Lisp_Object adjust_coding_eol_type P_ ((struct coding_system *, int));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
902 static void decode_eol P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
903 static Lisp_Object get_translation_table P_ ((Lisp_Object, int, int *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
904 static Lisp_Object get_translation P_ ((Lisp_Object, int *, int *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
905 int, int *, int *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
906 static int produce_chars P_ ((struct coding_system *, Lisp_Object, int));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
907 static INLINE void produce_composition P_ ((struct coding_system *, int *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
908 EMACS_INT));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
909 static INLINE void produce_charset P_ ((struct coding_system *, int *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
910 EMACS_INT));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
911 static void produce_annotation P_ ((struct coding_system *, EMACS_INT));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
912 static int decode_coding P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
913 static INLINE int *handle_composition_annotation P_ ((EMACS_INT, EMACS_INT,
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
914 struct coding_system *,
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
915 int *, EMACS_INT *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
916 static INLINE int *handle_charset_annotation P_ ((EMACS_INT, EMACS_INT,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
917 struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
918 int *, EMACS_INT *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
919 static void consume_chars P_ ((struct coding_system *, Lisp_Object, int));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
920 static int encode_coding P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
921 static Lisp_Object make_conversion_work_buffer P_ ((int));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
922 static Lisp_Object code_conversion_restore P_ ((Lisp_Object));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
923 static INLINE int char_encodable_p P_ ((int, Lisp_Object));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
924 static Lisp_Object make_subsidiaries P_ ((Lisp_Object));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
925
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
926 static void
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
927 record_conversion_result (struct coding_system *coding,
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
928 enum coding_result_code result)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
929 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
930 coding->result = result;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
931 switch (result)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
932 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
933 case CODING_RESULT_INSUFFICIENT_SRC:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
934 Vlast_code_conversion_error = Qinsufficient_source;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
935 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
936 case CODING_RESULT_INCONSISTENT_EOL:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
937 Vlast_code_conversion_error = Qinconsistent_eol;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
938 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
939 case CODING_RESULT_INVALID_SRC:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
940 Vlast_code_conversion_error = Qinvalid_source;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
941 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
942 case CODING_RESULT_INTERRUPT:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
943 Vlast_code_conversion_error = Qinterrupted;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
944 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
945 case CODING_RESULT_INSUFFICIENT_MEM:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
946 Vlast_code_conversion_error = Qinsufficient_memory;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
947 break;
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
948 default:
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
949 Vlast_code_conversion_error = intern ("Unknown error");
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
950 }
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
951 }
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
952
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Decode CODE of CHARSET and store the resulting character in C.

   charset_map_loaded is cleared before the call to DECODE_CHAR; if it
   is nonzero afterwards, CODING->source is recomputed with
   coding_set_source and SRC, SRC_BASE and SRC_END are shifted by the
   distance the source address moved.

   SRC, SRC_BASE, SRC_END and C must be lvalues.  All parameters are
   parenthesized in the expansion so that arbitrary expressions may be
   passed (e.g. `&cs' for CODING).  CODING is evaluated more than
   once.  */
#define CODING_DECODE_CHAR(coding, src, src_base, src_end, charset, code, c) \
  do {                                                                       \
    charset_map_loaded = 0;                                                  \
    (c) = DECODE_CHAR ((charset), (code));                                   \
    if (charset_map_loaded)                                                  \
      {                                                                      \
        const unsigned char *orig = (coding)->source;                        \
        EMACS_INT offset;                                                    \
                                                                             \
        coding_set_source ((coding));                                        \
        offset = (coding)->source - orig;                                    \
        (src) += offset;                                                     \
        (src_base) += offset;                                                \
        (src_end) += offset;                                                 \
      }                                                                      \
  } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
969
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
970
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
/* Make sure BYTES more bytes can be stored at dst.  If dst + BYTES
   would reach or pass dst_end, enlarge coding->destination with
   alloc_destination (asking for BYTES plus the number of elements
   remaining between charbuf and charbuf_end) and update dst and
   dst_end.  We don't have to take care of coding->source which will
   be relocated.  It is handled by calling coding_set_source in
   encode_coding.

   This macro relies on the caller's local variables `coding', `dst',
   `dst_end', `charbuf' and `charbuf_end'.  */

#define ASSURE_DESTINATION(bytes)                                    \
  do                                                                 \
    {                                                                \
      if (dst_end <= dst + (bytes))                                  \
        {                                                            \
          int more_bytes = (bytes) + (charbuf_end - charbuf);        \
                                                                     \
          dst = alloc_destination (coding, more_bytes, dst);         \
          dst_end = coding->destination + coding->dst_bytes;         \
        }                                                            \
    }                                                                \
  while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
986
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
987
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
/* Store multibyte form of the character C in P, and advance P to the
   end of the multibyte form.  This is like CHAR_STRING_ADVANCE but it
   never calls MAYBE_UNIFY_CHAR.

   C and P are evaluated several times, so neither may have side
   effects; P must be a modifiable pointer lvalue.  Every use of C is
   parenthesized so that an expression such as `a | b' is encoded
   correctly in all branches (the 4- and 5-byte branches used to
   expand C bare).  */

#define CHAR_STRING_ADVANCE_NO_UNIFY(c, p)              \
  do {                                                  \
    if ((c) <= MAX_1_BYTE_CHAR)                         \
      *(p)++ = (c);                                     \
    else if ((c) <= MAX_2_BYTE_CHAR)                    \
      *(p)++ = (0xC0 | ((c) >> 6)),                     \
        *(p)++ = (0x80 | ((c) & 0x3F));                 \
    else if ((c) <= MAX_3_BYTE_CHAR)                    \
      *(p)++ = (0xE0 | ((c) >> 12)),                    \
        *(p)++ = (0x80 | (((c) >> 6) & 0x3F)),          \
        *(p)++ = (0x80 | ((c) & 0x3F));                 \
    else if ((c) <= MAX_4_BYTE_CHAR)                    \
      *(p)++ = (0xF0 | ((c) >> 18)),                    \
        *(p)++ = (0x80 | (((c) >> 12) & 0x3F)),         \
        *(p)++ = (0x80 | (((c) >> 6) & 0x3F)),          \
        *(p)++ = (0x80 | ((c) & 0x3F));                 \
    else if ((c) <= MAX_5_BYTE_CHAR)                    \
      *(p)++ = 0xF8,                                    \
        *(p)++ = (0x80 | (((c) >> 18) & 0x0F)),         \
        *(p)++ = (0x80 | (((c) >> 12) & 0x3F)),         \
        *(p)++ = (0x80 | (((c) >> 6) & 0x3F)),          \
        *(p)++ = (0x80 | ((c) & 0x3F));                 \
    else                                                \
      (p) += BYTE8_STRING ((c) - 0x3FFF80, p);          \
  } while (0)
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1017
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1018
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
/* Read the multibyte form that starts at P, yield its character code,
   and leave P pointing just past that form.  The length (1 to 5
   bytes) is chosen from the high bits of the first byte.  A two-byte
   form whose first byte is below 0xC2 yields a code with 0x3FFF80
   or'ed in.  This is the counterpart of STRING_CHAR_ADVANCE that
   never calls MAYBE_UNIFY_CHAR.  P is evaluated several times and
   must be a modifiable pointer lvalue.  */

#define STRING_CHAR_ADVANCE_NO_UNIFY(p)                                 \
  (((p)[0] & 0x80) == 0                                                 \
   ? *(p)++                                                             \
   : ((p)[0] & 0x20) == 0                                               \
   ? ((p) += 2,                                                         \
      ((((p)[-2] & 0x1F) << 6)                                          \
       | ((p)[-1] & 0x3F)                                               \
       | ((unsigned char) ((p)[-2]) < 0xC2 ? 0x3FFF80 : 0)))            \
   : ((p)[0] & 0x10) == 0                                               \
   ? ((p) += 3,                                                         \
      ((((p)[-3] & 0x0F) << 12)                                         \
       | (((p)[-2] & 0x3F) << 6)                                        \
       | ((p)[-1] & 0x3F)))                                             \
   : ((p)[0] & 0x08) == 0                                               \
   ? ((p) += 4,                                                         \
      ((((p)[-4] & 0xF) << 18)                                          \
       | (((p)[-3] & 0x3F) << 12)                                       \
       | (((p)[-2] & 0x3F) << 6)                                        \
       | ((p)[-1] & 0x3F)))                                             \
   : ((p) += 5,                                                         \
      ((((p)[-4] & 0x3F) << 18)                                         \
       | (((p)[-3] & 0x3F) << 12)                                       \
       | (((p)[-2] & 0x3F) << 6)                                        \
       | ((p)[-1] & 0x3F))))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1047
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1048
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1049 static void
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1050 coding_set_source (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1051 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1052 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1053 if (BUFFERP (coding->src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1054 {
89418
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
1055 struct buffer *buf = XBUFFER (coding->src_object);
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
1056
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1057 if (coding->src_pos < 0)
89418
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
1058 coding->source = BUF_GAP_END_ADDR (buf) + coding->src_pos_byte;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1059 else
89418
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
1060 coding->source = BUF_BYTE_ADDRESS (buf, coding->src_pos_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1061 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1062 else if (STRINGP (coding->src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1063 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1064 coding->source = SDATA (coding->src_object) + coding->src_pos_byte;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1065 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1066 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1067 /* Otherwise, the source is C string and is never relocated
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1068 automatically. Thus we don't have to update anything. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1069 ;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1070 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1071
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1072 static void
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1073 coding_set_destination (coding)
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1074 struct coding_system *coding;
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1075 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1076 if (BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1077 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1078 if (coding->src_pos < 0)
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1079 {
91807
507bcfb4342c * coding.c (coding_set_destination): Use BEG_BYTE rather than hardcoding 1.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 91622
diff changeset
1080 coding->destination = BEG_ADDR + coding->dst_pos_byte - BEG_BYTE;
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1081 coding->dst_bytes = (GAP_END_ADDR
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1082 - (coding->src_bytes - coding->consumed)
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1083 - coding->destination);
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1084 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1085 else
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1086 {
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1087 /* We are sure that coding->dst_pos_byte is before the gap
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1088 of the buffer. */
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1089 coding->destination = (BUF_BEG_ADDR (XBUFFER (coding->dst_object))
91807
507bcfb4342c * coding.c (coding_set_destination): Use BEG_BYTE rather than hardcoding 1.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 91622
diff changeset
1090 + coding->dst_pos_byte - BEG_BYTE);
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1091 coding->dst_bytes = (BUF_GAP_END_ADDR (XBUFFER (coding->dst_object))
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1092 - coding->destination);
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1093 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1094 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1095 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1096 /* Otherwise, the destination is C string and is never relocated
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1097 automatically. Thus we don't have to update anything. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1098 ;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1099 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1100
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1101
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1102 static void
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1103 coding_alloc_by_realloc (coding, bytes)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1104 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1105 EMACS_INT bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1106 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1107 coding->destination = (unsigned char *) xrealloc (coding->destination,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1108 coding->dst_bytes + bytes);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1109 coding->dst_bytes += bytes;
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1110 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1111
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1112 static void
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1113 coding_alloc_by_making_gap (coding, gap_head_used, bytes)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1114 struct coding_system *coding;
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1115 EMACS_INT gap_head_used, bytes;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1116 {
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1117 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1118 {
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1119 /* The gap may contain the produced data at the head and not-yet
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1120 consumed data at the tail. To preserve those data, we at
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1121 first make the gap size to zero, then increase the gap
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1122 size. */
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1123 EMACS_INT add = GAP_SIZE;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1124
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1125 GPT += gap_head_used, GPT_BYTE += gap_head_used;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1126 GAP_SIZE = 0; ZV += add; Z += add; ZV_BYTE += add; Z_BYTE += add;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1127 make_gap (bytes);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1128 GAP_SIZE += add; ZV -= add; Z -= add; ZV_BYTE -= add; Z_BYTE -= add;
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1129 GPT -= gap_head_used, GPT_BYTE -= gap_head_used;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1130 }
90292
697c08d95af7 Cancel incorrect synching with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90291
diff changeset
1131 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1132 {
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
1133 Lisp_Object this_buffer;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
1134
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
1135 this_buffer = Fcurrent_buffer ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1136 set_buffer_internal (XBUFFER (coding->dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1137 make_gap (bytes);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1138 set_buffer_internal (XBUFFER (this_buffer));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1139 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1140 }
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1141
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1142
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Request NBYTES from the allocator that matches the destination of
   CODING: coding_alloc_by_making_gap when coding->dst_object is a
   buffer, coding_alloc_by_realloc otherwise.  Afterwards record
   CODING_RESULT_SUCCESS, call coding_set_destination, and return the
   pointer that lies at the same offset from coding->destination as
   DST did on entry.
   NOTE(review): the two allocators are presumed to make room for
   NBYTES more bytes of output -- confirm against their definitions.  */
1143 static unsigned char *
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1144 alloc_destination (coding, nbytes, dst)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1145 struct coding_system *coding;
89545
4f394eed6ff2 (inhibit_pre_post_conversion): Removed (unused).
Dave Love <fx@gnu.org>
parents: 89519
diff changeset
1146 EMACS_INT nbytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1147 unsigned char *dst;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1148 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Keep DST as an offset so it can be re-based onto
   coding->destination after the calls below.  */
1149 EMACS_INT offset = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1150
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1151 if (BUFFERP (coding->dst_object))
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1152 {
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1153 struct buffer *buf = XBUFFER (coding->dst_object);
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1154
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
/* The second argument is the distance of DST from the gap address
   of the destination buffer.  */
1155 coding_alloc_by_making_gap (coding, dst - BUF_GPT_ADDR (buf), nbytes);
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1156 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1157 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1158 coding_alloc_by_realloc (coding, nbytes);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1159 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1160 coding_set_destination (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Re-base DST onto the current value of coding->destination.  */
1161 dst = coding->destination + offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1162 return dst;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1163 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1164
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1165 /** Macros for annotations. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1166
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1167 /* Maximum length of annotation data (sum of annotations for
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1168 composition and charset). */
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1169 #define MAX_ANNOTATION_LENGTH (4 + (MAX_COMPOSITION_COMPONENTS * 2) - 1 + 4)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1170
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1171 /* Annotation data is stored in the array coding->charbuf in this
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1172 format:
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1173 [ -LENGTH ANNOTATION_MASK NCHARS ... ]
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1174 LENGTH is the number of elements in the annotation.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1175 ANNOTATION_MASK is one of CODING_ANNOTATE_XXX_MASK.
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1176 NCHARS is the number of characters in the text annotated.
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1177
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1178 The format of the following elements depends on ANNOTATION_MASK.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1179
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1180 In the case of CODING_ANNOTATE_COMPOSITION_MASK, these elements
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1181 follow:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1182 ... METHOD [ COMPOSITION-COMPONENTS ... ]
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1183 METHOD is one of enum composition_method.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1184 Optional COMPOSITION-COMPONENTS are characters and composition
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1185 rules.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1186
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1187 In the case of CODING_ANNOTATE_CHARSET_MASK, one element CHARSET-ID
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1188 follows. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1189
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
/* Store the annotation header [ -LEN MASK NCHARS ] at BUF, advancing
   BUF past the three stored elements, and set the `annotated' flag of
   the variable `coding' that must be in scope where the macro is
   expanded.  There is deliberately no semicolon after `while (0)':
   the caller supplies it, so the expansion is exactly one statement
   and stays valid in an unbraced if/else.  */
1190 #define ADD_ANNOTATION_DATA(buf, len, mask, nchars) \
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1191 do { \
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1192 *(buf)++ = -(len); \
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1193 *(buf)++ = (mask); \
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1194 *(buf)++ = (nchars); \
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1195 coding->annotated = 1; \
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1196 } while (0)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1197
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
/* Store at BUF a composition annotation covering NCHARS characters:
   the header written by ADD_ANNOTATION_DATA with a length of 4 and
   CODING_ANNOTATE_COMPOSITION_MASK, followed by METHOD.  BUF is
   advanced past everything stored.  BUF and METHOD are used
   unparenthesized in the last assignment, so pass simple
   expressions.  */
1198 #define ADD_COMPOSITION_DATA(buf, nchars, method) \
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1199 do { \
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1200 ADD_ANNOTATION_DATA (buf, 4, CODING_ANNOTATE_COMPOSITION_MASK, nchars); \
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1201 *buf++ = method; \
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1202 } while (0)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1203
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1204
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
/* Store at BUF a charset annotation covering NCHARS characters: the
   header written by ADD_ANNOTATION_DATA with a length of 4 and
   CODING_ANNOTATE_CHARSET_MASK, followed by ID.  BUF is advanced past
   everything stored.  BUF and ID are used unparenthesized in the last
   assignment, so pass simple expressions.  */
1205 #define ADD_CHARSET_DATA(buf, nchars, id) \
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1206 do { \
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1207 ADD_ANNOTATION_DATA (buf, 4, CODING_ANNOTATE_CHARSET_MASK, nchars); \
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1208 *buf++ = id; \
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1209 } while (0)
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1210
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1211
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1212 /*** 2. Emacs' internal format (emacs-utf-8) ***/
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1213
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1214
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1215
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1216
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1217 /*** 3. UTF-8 ***/
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1218
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1219 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1220 Check if a text is encoded in UTF-8. If it is, return 1, else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1221 return 0. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1222
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Predicates classifying one byte value C by its high bits.  */
/* C is below 0x80: a complete one-octet sequence.  */
1223 #define UTF_8_1_OCTET_P(c) ((c) < 0x80)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* C has the form 10xxxxxx: a trailing (non-leading) octet.  */
1224 #define UTF_8_EXTRA_OCTET_P(c) (((c) & 0xC0) == 0x80)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* C has the form 110xxxxx: leading octet of a 2-octet sequence.  */
1225 #define UTF_8_2_OCTET_LEADING_P(c) (((c) & 0xE0) == 0xC0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* C has the form 1110xxxx: leading octet of a 3-octet sequence.  */
1226 #define UTF_8_3_OCTET_LEADING_P(c) (((c) & 0xF0) == 0xE0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* C has the form 11110xxx: leading octet of a 4-octet sequence.  */
1227 #define UTF_8_4_OCTET_LEADING_P(c) (((c) & 0xF8) == 0xF0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* C has the form 111110xx: leading octet of a 5-octet sequence.  */
1228 #define UTF_8_5_OCTET_LEADING_P(c) (((c) & 0xFC) == 0xF8)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1229
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
/* The byte order mark character, and the three bytes EF BB BF that
   encode it in UTF-8.  */
1230 #define UTF_BOM 0xFEFF
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1231 #define UTF_8_BOM_1 0xEF
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1232 #define UTF_8_BOM_2 0xBB
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1233 #define UTF_8_BOM_3 0xBF
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1234
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Examine the source of CODING for UTF-8 and record the outcome in
   DETECT_INFO.  CATEGORY_MASK_UTF_8 is always added to
   DETECT_INFO->checked.  When a byte sequence does not match any of
   the 1- to 5-octet forms tested in the loop, CATEGORY_MASK_UTF_8 is
   added to DETECT_INFO->rejected and 0 is returned.  The code at the
   `no_more_source' label rejects an incomplete trailing sequence in
   the last block (returning 0); otherwise it chooses between the
   with-signature and without-signature categories and returns 1.
   NOTE(review): the loop has no normal exit; `no_more_source' is
   presumably reached through ONE_MORE_BYTE when the source is
   exhausted -- confirm against that macro's definition.  */
1235 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1236 detect_coding_utf_8 (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1237 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1238 struct coding_detection_info *detect_info;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1239 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1240 const unsigned char *src = coding->source, *src_base;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1241 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1242 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1243 int consumed_chars = 0;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
/* Set when the source begins with the bytes UTF_8_BOM_1..3.  */
1244 int bom_found = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Set once at least one well-formed multi-octet sequence is seen.  */
1245 int found = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1246
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1247 detect_info->checked |= CATEGORY_MASK_UTF_8;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1248 /* A coding system of this category is always ASCII compatible. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1249 src += coding->head_ascii;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1250
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1251 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1252 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1253 int c, c1, c2, c3, c4;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1254
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
/* Remember where the current sequence starts.  */
1255 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1256 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
/* Negative values and one-octet bytes need no further checking.  */
1257 if (c < 0 || UTF_8_1_OCTET_P (c))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1258 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1259 ONE_MORE_BYTE (c1);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1260 if (c1 < 0 || ! UTF_8_EXTRA_OCTET_P (c1))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1261 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1262 if (UTF_8_2_OCTET_LEADING_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1263 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1264 found = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1265 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1266 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1267 ONE_MORE_BYTE (c2);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1268 if (c2 < 0 || ! UTF_8_EXTRA_OCTET_P (c2))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1269 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1270 if (UTF_8_3_OCTET_LEADING_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1271 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1272 found = 1;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
/* The three BOM bytes count only when the sequence starts at the
   very first byte of the source.  */
1273 if (src_base == coding->source
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1274 && c == UTF_8_BOM_1 && c1 == UTF_8_BOM_2 && c2 == UTF_8_BOM_3)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1275 bom_found = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1276 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1277 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1278 ONE_MORE_BYTE (c3);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1279 if (c3 < 0 || ! UTF_8_EXTRA_OCTET_P (c3))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1280 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1281 if (UTF_8_4_OCTET_LEADING_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1282 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1283 found = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1284 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1285 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1286 ONE_MORE_BYTE (c4);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1287 if (c4 < 0 || ! UTF_8_EXTRA_OCTET_P (c4))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1288 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1289 if (UTF_8_5_OCTET_LEADING_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1290 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1291 found = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1292 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1293 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1294 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1295 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
/* Reached only by `break': an ill-formed sequence was seen.  */
1296 detect_info->rejected |= CATEGORY_MASK_UTF_8;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1297 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1298
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1299 no_more_source:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
/* SRC beyond SRC_BASE means bytes of an unfinished sequence were
   read; in the last block that makes the text invalid.  */
1300 if (src_base < src && coding->mode & CODING_MODE_LAST_BLOCK)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
1301 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1302 detect_info->rejected |= CATEGORY_MASK_UTF_8;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
1303 return 0;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
1304 }
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1305 if (bom_found)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1306 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1307 /* The first character 0xFEFF doesn't necessarily mean a BOM. */
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1308 detect_info->found |= CATEGORY_MASK_UTF_8_SIG | CATEGORY_MASK_UTF_8_NOSIG;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1309 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1310 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1311 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1312 detect_info->rejected |= CATEGORY_MASK_UTF_8_SIG;
96571
a3f2a5a4b492 (detect_coding_utf_8): Set detect_info->found only when
Kenichi Handa <handa@m17n.org>
parents: 95585
diff changeset
/* Without any multi-octet sequence nothing is reported as found.  */
1313 if (found)
a3f2a5a4b492 (detect_coding_utf_8): Set detect_info->found only when
Kenichi Handa <handa@m17n.org>
parents: 95585
diff changeset
1314 detect_info->found |= CATEGORY_MASK_UTF_8_NOSIG;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1315 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1316 return 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1317 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1318
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1319
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1320 static void
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1321 decode_coding_utf_8 (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1322 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1323 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1324 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1325 const unsigned char *src_end = coding->source + coding->src_bytes;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1326 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1327 int *charbuf = coding->charbuf + coding->charbuf_used;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1328 int *charbuf_end = coding->charbuf + coding->charbuf_size;
100133
bca35d7cb3ac (decode_coding_utf_8): Likewise.
Kenichi Handa <handa@m17n.org>
parents: 100131
diff changeset
1329 int consumed_chars = 0, consumed_chars_base = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1330 int multibytep = coding->src_multibyte;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1331 enum utf_bom_type bom = CODING_UTF_8_BOM (coding);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1332 Lisp_Object attr, charset_list;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1333 int eol_crlf = EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1334 int byte_after_cr = -1;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1335
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1336 CODING_GET_INFO (coding, attr, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1337
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1338 if (bom != utf_without_bom)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1339 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1340 int c1, c2, c3;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1341
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1342 src_base = src;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1343 ONE_MORE_BYTE (c1);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1344 if (! UTF_8_3_OCTET_LEADING_P (c1))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1345 src = src_base;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1346 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1347 {
99074
10cd979d05ca (make_conversion_work_buffer): Check that Vcode_conversion_reused_workbuf
Noah Friedman <friedman@splode.com>
parents: 98992
diff changeset
1348 ONE_MORE_BYTE (c2);
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1349 if (! UTF_8_EXTRA_OCTET_P (c2))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1350 src = src_base;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1351 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1352 {
99074
10cd979d05ca (make_conversion_work_buffer): Check that Vcode_conversion_reused_workbuf
Noah Friedman <friedman@splode.com>
parents: 98992
diff changeset
1353 ONE_MORE_BYTE (c3);
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1354 if (! UTF_8_EXTRA_OCTET_P (c3))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1355 src = src_base;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1356 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1357 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1358 if ((c1 != UTF_8_BOM_1)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1359 || (c2 != UTF_8_BOM_2) || (c3 != UTF_8_BOM_3))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1360 src = src_base;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1361 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1362 CODING_UTF_8_BOM (coding) = utf_without_bom;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1363 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1364 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1365 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1366 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1367 CODING_UTF_8_BOM (coding) = utf_without_bom;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1368
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1369
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1370
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1371 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1372 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1373 int c, c1, c2, c3, c4, c5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1374
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1375 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1376 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1377
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1378 if (charbuf >= charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1379 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1380
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1381 if (byte_after_cr >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1382 c1 = byte_after_cr, byte_after_cr = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1383 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1384 ONE_MORE_BYTE (c1);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1385 if (c1 < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1386 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1387 c = - c1;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1388 }
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1389 else if (UTF_8_1_OCTET_P(c1))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1390 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1391 if (eol_crlf && c1 == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1392 ONE_MORE_BYTE (byte_after_cr);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1393 c = c1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1394 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1395 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1396 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1397 ONE_MORE_BYTE (c2);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1398 if (c2 < 0 || ! UTF_8_EXTRA_OCTET_P (c2))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1399 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1400 if (UTF_8_2_OCTET_LEADING_P (c1))
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1401 {
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1402 c = ((c1 & 0x1F) << 6) | (c2 & 0x3F);
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1403 /* Reject overlong sequences here and below. Encoders
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1404 producing them are incorrect, they can be misleading,
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1405 and they mess up read/write invariance. */
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1406 if (c < 128)
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1407 goto invalid_code;
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1408 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1409 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1410 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1411 ONE_MORE_BYTE (c3);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1412 if (c3 < 0 || ! UTF_8_EXTRA_OCTET_P (c3))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1413 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1414 if (UTF_8_3_OCTET_LEADING_P (c1))
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1415 {
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1416 c = (((c1 & 0xF) << 12)
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1417 | ((c2 & 0x3F) << 6) | (c3 & 0x3F));
89184
88a9e962e183 (decode_coding_utf_8): Treat surrogates as invalid.
Dave Love <fx@gnu.org>
parents: 89042
diff changeset
1418 if (c < 0x800
88a9e962e183 (decode_coding_utf_8): Treat surrogates as invalid.
Dave Love <fx@gnu.org>
parents: 89042
diff changeset
1419 || (c >= 0xd800 && c < 0xe000)) /* surrogates (invalid) */
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1420 goto invalid_code;
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1421 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1422 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1423 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1424 ONE_MORE_BYTE (c4);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1425 if (c4 < 0 || ! UTF_8_EXTRA_OCTET_P (c4))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1426 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1427 if (UTF_8_4_OCTET_LEADING_P (c1))
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1428 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1429 c = (((c1 & 0x7) << 18) | ((c2 & 0x3F) << 12)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1430 | ((c3 & 0x3F) << 6) | (c4 & 0x3F));
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1431 if (c < 0x10000)
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1432 goto invalid_code;
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1433 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1434 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1435 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1436 ONE_MORE_BYTE (c5);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1437 if (c5 < 0 || ! UTF_8_EXTRA_OCTET_P (c5))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1438 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1439 if (UTF_8_5_OCTET_LEADING_P (c1))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1440 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1441 c = (((c1 & 0x3) << 24) | ((c2 & 0x3F) << 18)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1442 | ((c3 & 0x3F) << 12) | ((c4 & 0x3F) << 6)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1443 | (c5 & 0x3F));
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1444 if ((c > MAX_CHAR) || (c < 0x200000))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1445 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1446 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1447 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1448 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1449 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1450 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1451 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1452 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1453
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1454 *charbuf++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1455 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1456
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1457 invalid_code:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1458 src = src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1459 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1460 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1461 *charbuf++ = ASCII_BYTE_P (c) ? c : BYTE8_TO_CHAR (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1462 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1463 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1464
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1465 no_more_source:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1466 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1467 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1468 coding->charbuf_used = charbuf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1469 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1470
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1471
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1472 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1473 encode_coding_utf_8 (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1474 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1475 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1476 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1477 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1478 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1479 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1480 unsigned char *dst_end = coding->destination + coding->dst_bytes;
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
1481 int produced_chars = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1482 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1483
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1484 if (CODING_UTF_8_BOM (coding) == utf_with_bom)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1485 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1486 ASSURE_DESTINATION (3);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1487 EMIT_THREE_BYTES (UTF_8_BOM_1, UTF_8_BOM_2, UTF_8_BOM_3);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1488 CODING_UTF_8_BOM (coding) = utf_without_bom;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1489 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1490
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1491 if (multibytep)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1492 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1493 int safe_room = MAX_MULTIBYTE_LENGTH * 2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1494
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1495 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1496 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1497 unsigned char str[MAX_MULTIBYTE_LENGTH], *p, *pend = str;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1498
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1499 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1500 c = *charbuf++;
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1501 if (CHAR_BYTE8_P (c))
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1502 {
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1503 c = CHAR_TO_BYTE8 (c);
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1504 EMIT_ONE_BYTE (c);
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1505 }
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1506 else
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1507 {
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1508 CHAR_STRING_ADVANCE_NO_UNIFY (c, pend);
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1509 for (p = str; p < pend; p++)
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1510 EMIT_ONE_BYTE (*p);
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1511 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1512 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1513 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1514 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1515 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1516 int safe_room = MAX_MULTIBYTE_LENGTH;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1517
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1518 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1519 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1520 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1521 c = *charbuf++;
89917
1763eef5ad02 (encode_coding_utf_8): Fix handling of raw-byte char.
Kenichi Handa <handa@m17n.org>
parents: 89905
diff changeset
1522 if (CHAR_BYTE8_P (c))
1763eef5ad02 (encode_coding_utf_8): Fix handling of raw-byte char.
Kenichi Handa <handa@m17n.org>
parents: 89905
diff changeset
1523 *dst++ = CHAR_TO_BYTE8 (c);
1763eef5ad02 (encode_coding_utf_8): Fix handling of raw-byte char.
Kenichi Handa <handa@m17n.org>
parents: 89905
diff changeset
1524 else
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1525 CHAR_STRING_ADVANCE_NO_UNIFY (c, dst);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1526 produced_chars++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1527 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1528 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1529 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1530 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1531 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1532 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1533 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1534
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1535
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1536 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1537 Check if a text is encoded in one of UTF-16 based coding systems.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1538 If it is, return 1, else return 0. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1539
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Nonzero if CODE is a UTF-16 high (leading) surrogate.  Only bits
   10..15 of CODE are inspected; they must equal those of 0xD800.  */
#define UTF_16_HIGH_SURROGATE_P(code) (((code) & 0xFC00) == 0xD800)

/* Nonzero if CODE is a UTF-16 low (trailing) surrogate.  Only bits
   10..15 of CODE are inspected; they must equal those of 0xDC00.  */
#define UTF_16_LOW_SURROGATE_P(code) (((code) & 0xFC00) == 0xDC00)

/* Nonzero if CODE is 0xFFFE, 0xFFFF, or a low surrogate.  CODE may be
   evaluated up to three times, so it must not have side effects.  */
#define UTF_16_INVALID_P(code)                  \
  (((code) == 0xFFFE)                           \
   || ((code) == 0xFFFF)                        \
   || UTF_16_LOW_SURROGATE_P (code))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1550
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1551
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1552 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1553 detect_coding_utf_16 (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1554 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1555 struct coding_detection_info *detect_info;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1556 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1557 const unsigned char *src = coding->source, *src_base = src;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1558 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1559 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1560 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1561 int c1, c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1562
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1563 detect_info->checked |= CATEGORY_MASK_UTF_16;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1564 if (coding->mode & CODING_MODE_LAST_BLOCK
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1565 && (coding->src_chars & 1))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1566 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1567 detect_info->rejected |= CATEGORY_MASK_UTF_16;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1568 return 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1569 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1570
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1571 ONE_MORE_BYTE (c1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1572 ONE_MORE_BYTE (c2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1573 if ((c1 == 0xFF) && (c2 == 0xFE))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1574 {
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1575 detect_info->found |= (CATEGORY_MASK_UTF_16_LE
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1576 | CATEGORY_MASK_UTF_16_AUTO);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1577 detect_info->rejected |= (CATEGORY_MASK_UTF_16_BE
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1578 | CATEGORY_MASK_UTF_16_BE_NOSIG
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1579 | CATEGORY_MASK_UTF_16_LE_NOSIG);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1580 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1581 else if ((c1 == 0xFE) && (c2 == 0xFF))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1582 {
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1583 detect_info->found |= (CATEGORY_MASK_UTF_16_BE
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1584 | CATEGORY_MASK_UTF_16_AUTO);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1585 detect_info->rejected |= (CATEGORY_MASK_UTF_16_LE
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1586 | CATEGORY_MASK_UTF_16_BE_NOSIG
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1587 | CATEGORY_MASK_UTF_16_LE_NOSIG);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1588 }
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1589 else
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1590 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1591 /* We check the dispersion of Eth and Oth bytes where E is even and
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1592 O is odd. If both are high, we assume binary data.*/
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1593 unsigned char e[256], o[256];
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1594 unsigned e_num = 1, o_num = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1596 memset (e, 0, 256);
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1597 memset (o, 0, 256);
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1598 e[c1] = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1599 o[c2] = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1600
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1601 detect_info->rejected
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1602 |= (CATEGORY_MASK_UTF_16_BE | CATEGORY_MASK_UTF_16_LE);
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1603
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1604 while (1)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1605 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1606 ONE_MORE_BYTE (c1);
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1607 ONE_MORE_BYTE (c2);
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1608 if (! e[c1])
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1609 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1610 e[c1] = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1611 e_num++;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1612 if (e_num >= 128)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1613 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1614 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1615 if (! o[c2])
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1616 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1617 o[c1] = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1618 o_num++;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1619 if (o_num >= 128)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1620 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1621 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1622 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1623 detect_info->rejected |= CATEGORY_MASK_UTF_16;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1624 return 0;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1625 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1626
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1627 no_more_source:
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
1628 return 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1629 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1630
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1631 static void
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1632 decode_coding_utf_16 (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1633 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1634 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1635 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1636 const unsigned char *src_end = coding->source + coding->src_bytes;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1637 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1638 int *charbuf = coding->charbuf + coding->charbuf_used;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1639 int *charbuf_end = coding->charbuf + coding->charbuf_size;
100131
0e4115b39b5d (decode_coding_utf_16): Initialize consumed_chars_base
Kenichi Handa <handa@m17n.org>
parents: 99753
diff changeset
1640 int consumed_chars = 0, consumed_chars_base = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1641 int multibytep = coding->src_multibyte;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1642 enum utf_bom_type bom = CODING_UTF_16_BOM (coding);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1643 enum utf_16_endian_type endian = CODING_UTF_16_ENDIAN (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1644 int surrogate = CODING_UTF_16_SURROGATE (coding);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1645 Lisp_Object attr, charset_list;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1646 int eol_crlf = EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1647 int byte_after_cr1 = -1, byte_after_cr2 = -1;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1648
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1649 CODING_GET_INFO (coding, attr, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1650
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1651 if (bom == utf_with_bom)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1652 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1653 int c, c1, c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1654
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1655 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1656 ONE_MORE_BYTE (c1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1657 ONE_MORE_BYTE (c2);
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
1658 c = (c1 << 8) | c2;
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1659
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1660 if (endian == utf_16_big_endian
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1661 ? c != 0xFEFF : c != 0xFFFE)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1662 {
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1663 /* The first two bytes are not BOM. Treat them as bytes
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1664 for a normal character. */
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1665 src = src_base;
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1666 coding->errors++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1667 }
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1668 CODING_UTF_16_BOM (coding) = utf_without_bom;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1669 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1670 else if (bom == utf_detect_bom)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1671 {
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1672 /* We have already tried to detect BOM and failed in
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1673 detect_coding. */
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1674 CODING_UTF_16_BOM (coding) = utf_without_bom;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1675 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1676
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1677 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1678 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1679 int c, c1, c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1680
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1681 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1682 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1683
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1684 if (charbuf + 2 >= charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1685 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1686
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1687 if (byte_after_cr1 >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1688 c1 = byte_after_cr1, byte_after_cr1 = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1689 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1690 ONE_MORE_BYTE (c1);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1691 if (c1 < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1692 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1693 *charbuf++ = -c1;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1694 continue;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1695 }
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1696 if (byte_after_cr2 >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1697 c2 = byte_after_cr2, byte_after_cr2 = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1698 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1699 ONE_MORE_BYTE (c2);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1700 if (c2 < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1701 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1702 *charbuf++ = ASCII_BYTE_P (c1) ? c1 : BYTE8_TO_CHAR (c1);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1703 *charbuf++ = -c2;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1704 continue;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1705 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1706 c = (endian == utf_16_big_endian
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
1707 ? ((c1 << 8) | c2) : ((c2 << 8) | c1));
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1708
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1709 if (surrogate)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1710 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1711 if (! UTF_16_LOW_SURROGATE_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1712 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1713 if (endian == utf_16_big_endian)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1714 c1 = surrogate >> 8, c2 = surrogate & 0xFF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1715 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1716 c1 = surrogate & 0xFF, c2 = surrogate >> 8;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1717 *charbuf++ = c1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1718 *charbuf++ = c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1719 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1720 if (UTF_16_HIGH_SURROGATE_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1721 CODING_UTF_16_SURROGATE (coding) = surrogate = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1722 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1723 *charbuf++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1724 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1725 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1726 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1727 c = ((surrogate - 0xD800) << 10) | (c - 0xDC00);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1728 CODING_UTF_16_SURROGATE (coding) = surrogate = 0;
89842
b5f22f538c1f (decode_coding_utf_16): Fix handling of surrogate pare.
Kenichi Handa <handa@m17n.org>
parents: 89780
diff changeset
1729 *charbuf++ = 0x10000 + c;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1730 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1731 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1732 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1733 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1734 if (UTF_16_HIGH_SURROGATE_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1735 CODING_UTF_16_SURROGATE (coding) = surrogate = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1736 else
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1737 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1738 if (eol_crlf && c == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1739 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1740 ONE_MORE_BYTE (byte_after_cr1);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1741 ONE_MORE_BYTE (byte_after_cr2);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1742 }
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1743 *charbuf++ = c;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1744 }
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1745 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1746 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1747
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1748 no_more_source:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1749 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1750 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1751 coding->charbuf_used = charbuf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1752 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1753
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1754 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1755 encode_coding_utf_16 (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1756 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1757 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1758 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1759 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1760 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1761 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1762 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1763 int safe_room = 8;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1764 enum utf_bom_type bom = CODING_UTF_16_BOM (coding);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1765 int big_endian = CODING_UTF_16_ENDIAN (coding) == utf_16_big_endian;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1766 int produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1767 Lisp_Object attrs, charset_list;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1768 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1769
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1770 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1771
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1772 if (bom != utf_without_bom)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1773 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1774 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1775 if (big_endian)
89404
3e1d187b52c3 (Qutf_16_be_nosig, Qutf_16_be, Qutf_16_le_nosig)
Kenichi Handa <handa@m17n.org>
parents: 89394
diff changeset
1776 EMIT_TWO_BYTES (0xFE, 0xFF);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1777 else
89404
3e1d187b52c3 (Qutf_16_be_nosig, Qutf_16_be, Qutf_16_le_nosig)
Kenichi Handa <handa@m17n.org>
parents: 89394
diff changeset
1778 EMIT_TWO_BYTES (0xFF, 0xFE);
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1779 CODING_UTF_16_BOM (coding) = utf_without_bom;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1780 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1781
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1782 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1783 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1784 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1785 c = *charbuf++;
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
1786 if (c >= MAX_UNICODE_CHAR)
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
1787 c = coding->default_char;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1788
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1789 if (c < 0x10000)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1790 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1791 if (big_endian)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1792 EMIT_TWO_BYTES (c >> 8, c & 0xFF);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1793 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1794 EMIT_TWO_BYTES (c & 0xFF, c >> 8);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1795 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1796 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1797 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1798 int c1, c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1799
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1800 c -= 0x10000;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1801 c1 = (c >> 10) + 0xD800;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1802 c2 = (c & 0x3FF) + 0xDC00;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1803 if (big_endian)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1804 EMIT_FOUR_BYTES (c1 >> 8, c1 & 0xFF, c2 >> 8, c2 & 0xFF);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1805 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1806 EMIT_FOUR_BYTES (c1 & 0xFF, c1 >> 8, c2 & 0xFF, c2 >> 8);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1807 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1808 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1809 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1810 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1811 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1812 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1813 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1814
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1815
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1816 /*** 6. Old Emacs' internal format (emacs-mule) ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1817
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1818 /* Emacs' internal format for representation of multiple character
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1819 sets is a kind of multi-byte encoding, i.e. characters are
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1820 represented by variable-length sequences of one-byte codes.
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1821
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1822 ASCII characters and control characters (e.g. `tab', `newline') are
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1823 represented by one-byte sequences which are their ASCII codes, in
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1824 the range 0x00 through 0x7F.
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1825
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1826 8-bit characters of the range 0x80..0x9F are represented by
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1827 two-byte sequences of LEADING_CODE_8_BIT_CONTROL and (their 8-bit
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1828 code + 0x20).
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1829
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1830 8-bit characters of the range 0xA0..0xFF are represented by
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1831 one-byte sequences which are their 8-bit code.
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1832
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1833 The other characters are represented by a sequence of `base
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1834 leading-code', optional `extended leading-code', and one or two
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1835 `position-code's. The length of the sequence is determined by the
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1836 base leading-code. Leading-code takes the range 0x81 through 0x9D,
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1837 whereas extended leading-code and position-code take the range 0xA0
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1838 through 0xFF. See `charset.h' for more details about leading-code
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1839 and position-code.
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
1840
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1841 --- CODE RANGE of Emacs' internal format ---
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1842 character set range
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1843 ------------- -----
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1844 ascii 0x00..0x7F
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1845 eight-bit-control LEADING_CODE_8_BIT_CONTROL + 0xA0..0xBF
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1846 eight-bit-graphic 0xA0..0xFF
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1847 ELSE 0x81..0x9D + [0xA0..0xFF]+
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1848 ---------------------------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1849
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1850 As this is the internal character representation, the format is
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1851 usually not used externally (i.e. in a file or in data sent to a
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1852 process). But, it is possible to have a text externally in this
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1853 format (i.e. by encoding by the coding system `emacs-mule').
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1854
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1855 In that case, a sequence of one-byte codes has a slightly different
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1856 form.
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1857
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1858 First, all characters in eight-bit-control are represented by
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1859 one-byte sequences which are their 8-bit code.
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1860
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1861 Next, character composition data are represented by the byte
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1862 sequence of the form: 0x80 METHOD BYTES CHARS COMPONENT ...,
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1863 where,
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1864 METHOD is 0xF0 plus one of the composition methods (enum
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1865 composition_method),
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1866
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1867 BYTES is 0xA0 plus a byte length of this composition data,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1868
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1869 CHARS is 0x20 plus a number of characters composed by this
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1870 data,
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1871
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1872 COMPONENTs are characters of multibyte form or composition
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1873 rules encoded by two bytes of ASCII codes.
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1874
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1875 In addition, for backward compatibility, the following formats are
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1876 also recognized as composition data on decoding.
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1877
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1878 0x80 MSEQ ...
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1879 0x80 0xFF MSEQ RULE MSEQ RULE ... MSEQ
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1880
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1881 Here,
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1882 MSEQ is a multibyte form but in this special format:
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1883 ASCII: 0xA0 ASCII_CODE+0x80,
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1884 other: LEADING_CODE+0x20 FOLLOWING-BYTE ...,
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1885 RULE is a one byte code of the range 0xA0..0xF0 that
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1886 represents a composition rule.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1887 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1888
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1889 char emacs_mule_bytes[256];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1890
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1891 int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1892 emacs_mule_char (coding, src, nbytes, nchars, id)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1893 struct coding_system *coding;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1894 const unsigned char *src;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1895 int *nbytes, *nchars, *id;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1896 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1897 const unsigned char *src_end = coding->source + coding->src_bytes;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1898 const unsigned char *src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1899 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1900 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1901 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1902 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1903 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1904
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1905 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1906 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1907 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1908 c = -c;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1909 charset = emacs_mule_charset[0];
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1910 }
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1911 else
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1912 {
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
1913 if (c >= 0xA0)
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
1914 {
92030
52c3ba60b54b Fix comment typo.
Glenn Morris <rgm@gnu.org>
parents: 91838
diff changeset
1915 /* Old style component character of a composition. */
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
1916 if (c == 0xA0)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1917 {
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
1918 ONE_MORE_BYTE (c);
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
1919 c -= 0x80;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1920 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1921 else
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1922 c -= 0x20;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1923 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1924
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1925 switch (emacs_mule_bytes[c])
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1926 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1927 case 2:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1928 if (! (charset = emacs_mule_charset[c]))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1929 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1930 ONE_MORE_BYTE (c);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1931 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1932 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1933 code = c & 0x7F;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1934 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1935
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1936 case 3:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1937 if (c == EMACS_MULE_LEADING_CODE_PRIVATE_11
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1938 || c == EMACS_MULE_LEADING_CODE_PRIVATE_12)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1939 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1940 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
1941 if (c < 0xA0 || ! (charset = emacs_mule_charset[c]))
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1942 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1943 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
1944 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1945 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1946 code = c & 0x7F;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1947 }
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
1948 else
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1949 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1950 if (! (charset = emacs_mule_charset[c]))
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1951 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1952 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
1953 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1954 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1955 code = (c & 0x7F) << 8;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1956 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
1957 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1958 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1959 code |= c & 0x7F;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1960 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1961 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1962
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1963 case 4:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1964 ONE_MORE_BYTE (c);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1965 if (c < 0 || ! (charset = emacs_mule_charset[c]))
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1966 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1967 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
1968 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1969 goto invalid_code;
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
1970 code = (c & 0x7F) << 8;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1971 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
1972 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1973 goto invalid_code;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1974 code |= c & 0x7F;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1975 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1976
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1977 case 1:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1978 code = c;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1979 charset = CHARSET_FROM_ID (ASCII_BYTE_P (code)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1980 ? charset_ascii : charset_eight_bit);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1981 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1982
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1983 default:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1984 abort ();
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1985 }
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1986 c = DECODE_CHAR (charset, code);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1987 if (c < 0)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1988 goto invalid_code;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1989 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1990 *nbytes = src - src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1991 *nchars = consumed_chars;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1992 if (id)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1993 *id = charset->id;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1994 return c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1995
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1996 no_more_source:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1997 return -2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1998
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1999 invalid_code:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2000 return -1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2001 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2002
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2003
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2004 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2005 Check if a text is encoded in `emacs-mule'. If it is, return 1,
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2006 else return 0. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2007
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
2008 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2009 detect_coding_emacs_mule (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2010 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2011 struct coding_detection_info *detect_info;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2012 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2013 const unsigned char *src = coding->source, *src_base;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2014 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2015 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2016 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2017 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2018 int found = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2019
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2020 detect_info->checked |= CATEGORY_MASK_EMACS_MULE;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2021 /* A coding system of this category is always ASCII compatible. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2022 src += coding->head_ascii;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2023
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2024 while (1)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2025 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2026 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2027 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2028 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2029 continue;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2030 if (c == 0x80)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2031 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2032 /* Perhaps the start of a composite character. We simply skip
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2033 it because analyzing it is too heavy for detecting. But,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2034 at least, we check that the composite character
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
2035 consists of more than 4 bytes. */
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2036 const unsigned char *src_base;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2037
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2038 repeat:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2039 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2040 do
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2041 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2042 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2043 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2044 while (c >= 0xA0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2045
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2046 if (src - src_base <= 4)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2047 break;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2048 found = CATEGORY_MASK_EMACS_MULE;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2049 if (c == 0x80)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2050 goto repeat;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2051 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2052
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2053 if (c < 0x80)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2054 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2055 if (c < 0x20
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2056 && (c == ISO_CODE_ESC || c == ISO_CODE_SI || c == ISO_CODE_SO))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2057 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2058 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2059 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2060 {
89848
3edfa038a435 (detect_coding_emacs_mule): Fix counting of encoded
Kenichi Handa <handa@m17n.org>
parents: 89842
diff changeset
2061 int more_bytes = emacs_mule_bytes[*src_base] - 1;
3edfa038a435 (detect_coding_emacs_mule): Fix counting of encoded
Kenichi Handa <handa@m17n.org>
parents: 89842
diff changeset
2062
3edfa038a435 (detect_coding_emacs_mule): Fix counting of encoded
Kenichi Handa <handa@m17n.org>
parents: 89842
diff changeset
2063 while (more_bytes > 0)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2064 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2065 ONE_MORE_BYTE (c);
89848
3edfa038a435 (detect_coding_emacs_mule): Fix counting of encoded
Kenichi Handa <handa@m17n.org>
parents: 89842
diff changeset
2066 if (c < 0xA0)
3edfa038a435 (detect_coding_emacs_mule): Fix counting of encoded
Kenichi Handa <handa@m17n.org>
parents: 89842
diff changeset
2067 {
3edfa038a435 (detect_coding_emacs_mule): Fix counting of encoded
Kenichi Handa <handa@m17n.org>
parents: 89842
diff changeset
2068 src--; /* Unread the last byte. */
3edfa038a435 (detect_coding_emacs_mule): Fix counting of encoded
Kenichi Handa <handa@m17n.org>
parents: 89842
diff changeset
2069 break;
3edfa038a435 (detect_coding_emacs_mule): Fix counting of encoded
Kenichi Handa <handa@m17n.org>
parents: 89842
diff changeset
2070 }
3edfa038a435 (detect_coding_emacs_mule): Fix counting of encoded
Kenichi Handa <handa@m17n.org>
parents: 89842
diff changeset
2071 more_bytes--;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2072 }
89848
3edfa038a435 (detect_coding_emacs_mule): Fix counting of encoded
Kenichi Handa <handa@m17n.org>
parents: 89842
diff changeset
2073 if (more_bytes != 0)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2074 break;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2075 found = CATEGORY_MASK_EMACS_MULE;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2076 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2077 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2078 detect_info->rejected |= CATEGORY_MASK_EMACS_MULE;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2079 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2080
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2081 no_more_source:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2082 if (src_base < src && coding->mode & CODING_MODE_LAST_BLOCK)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
2083 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2084 detect_info->rejected |= CATEGORY_MASK_EMACS_MULE;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
2085 return 0;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
2086 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2087 detect_info->found |= found;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2088 return 1;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2089 }
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2090
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2091
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2092 /* See the above "GENERAL NOTES on `decode_coding_XXX ()' functions". */
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2093
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2094 /* Decode a character represented as a component of composition
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2095 sequence of Emacs 20/21 style at SRC. Set C to that character and
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2096 update SRC to the head of next character (or an encoded composition
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2097 rule). If SRC doesn't point to a composition component, set C to -1.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2098 If SRC points to an invalid byte sequence, global exit by a return
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2099 value 0. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2100
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2101 #define DECODE_EMACS_MULE_COMPOSITION_CHAR(buf) \
91622
0a283ea23533 (DECODE_EMACS_MULE_COMPOSITION_CHAR): Use "do...while (0)".
Jan Djärv <jan.h.d@swipnet.se>
parents: 91535
diff changeset
2102 do \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2103 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2104 int c; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2105 int nbytes, nchars; \
51356
8da3b8a0ca4f (DECODE_EMACS_MULE_COMPOSITION_CHAR): If coding->flags
Kenichi Handa <handa@m17n.org>
parents: 51327
diff changeset
2106 \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2107 if (src == src_end) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2108 break; \
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2109 c = emacs_mule_char (coding, src, &nbytes, &nchars, NULL);\
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2110 if (c < 0) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2111 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2112 if (c == -2) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2113 break; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2114 goto invalid_code; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2115 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2116 *buf++ = c; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2117 src += nbytes; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2118 consumed_chars += nchars; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2119 } \
91622
0a283ea23533 (DECODE_EMACS_MULE_COMPOSITION_CHAR): Use "do...while (0)".
Jan Djärv <jan.h.d@swipnet.se>
parents: 91535
diff changeset
2120 while (0)
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2121
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2122
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2123 /* Decode a composition rule represented as a component of composition
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2124 sequence of Emacs 20 style at SRC. Store the decoded rule in *BUF,
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2125 and increment BUF. If SRC points to an invalid byte sequence, jump
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2126 to the label invalid_code. */
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2127
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2128 #define DECODE_EMACS_MULE_COMPOSITION_RULE_20(buf) \
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2129 do { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2130 int c, gref, nref; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2131 \
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2132 if (src >= src_end) \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2133 goto invalid_code; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2134 ONE_MORE_BYTE_NO_CHECK (c); \
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2135 c -= 0xA0; \
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2136 if (c < 0 || c >= 81) \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2137 goto invalid_code; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2138 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2139 gref = c / 9, nref = c % 9; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2140 *buf++ = COMPOSITION_ENCODE_RULE (gref, nref); \
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2141 } while (0)
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2142
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2143
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2144 /* Decode a composition rule represented as a component of composition
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2145 sequence of Emacs 21 style at SRC. Store the decoded rule in *BUF,
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2146 and increment BUF. If SRC points to an invalid byte sequence, jump
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2147 to the label invalid_code. */
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2148
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2149 #define DECODE_EMACS_MULE_COMPOSITION_RULE_21(buf) \
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2150 do { \
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2151 int gref, nref; \
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2152 \
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2153 if (src + 1>= src_end) \
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2154 goto invalid_code; \
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2155 ONE_MORE_BYTE_NO_CHECK (gref); \
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2156 gref -= 0x20; \
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2157 ONE_MORE_BYTE_NO_CHECK (nref); \
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2158 nref -= 0x20; \
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2159 if (gref < 0 || gref >= 81 \
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2160 || nref < 0 || nref >= 81) \
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2161 goto invalid_code; \
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2162 *buf++ = COMPOSITION_ENCODE_RULE (gref, nref); \
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2163 } while (0)
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2164
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2165
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2166 #define DECODE_EMACS_MULE_21_COMPOSITION(c) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2167 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2168 /* Emacs 21 style format. The first three bytes at SRC are \
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2169 (METHOD - 0xF2), (BYTES - 0xA0), (CHARS - 0xA0), where BYTES is \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2170 the byte length of this composition information, CHARS is the \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2171 number of characters composed by this composition. */ \
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2172 enum composition_method method = c - 0xF2; \
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2173 int *charbuf_base = charbuf; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2174 int consumed_chars_limit; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2175 int nbytes, nchars; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2176 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2177 ONE_MORE_BYTE (c); \
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2178 if (c < 0) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2179 goto invalid_code; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2180 nbytes = c - 0xA0; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2181 if (nbytes < 3) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2182 goto invalid_code; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2183 ONE_MORE_BYTE (c); \
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2184 if (c < 0) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2185 goto invalid_code; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2186 nchars = c - 0xA0; \
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
2187 ADD_COMPOSITION_DATA (charbuf, nchars, method); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2188 consumed_chars_limit = consumed_chars_base + nbytes; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2189 if (method != COMPOSITION_RELATIVE) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2190 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2191 int i = 0; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2192 while (consumed_chars < consumed_chars_limit) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2193 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2194 if (i % 2 && method != COMPOSITION_WITH_ALTCHARS) \
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2195 DECODE_EMACS_MULE_COMPOSITION_RULE_21 (charbuf); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2196 else \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2197 DECODE_EMACS_MULE_COMPOSITION_CHAR (charbuf); \
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2198 i++; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2199 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2200 if (consumed_chars < consumed_chars_limit) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2201 goto invalid_code; \
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2202 charbuf_base[0] -= i; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2203 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2204 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2205
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2206
90363
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2207 #define DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION(c) \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2208 do { \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2209 /* Emacs 20 style format for relative composition. */ \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2210 /* Store multibyte form of characters to be composed. */ \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2211 enum composition_method method = COMPOSITION_RELATIVE; \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2212 int components[MAX_COMPOSITION_COMPONENTS * 2 - 1]; \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2213 int *buf = components; \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2214 int i, j; \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2215 \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2216 src = src_base; \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2217 ONE_MORE_BYTE (c); /* skip 0x80 */ \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2218 for (i = 0; *src >= 0xA0 && i < MAX_COMPOSITION_COMPONENTS; i++) \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2219 DECODE_EMACS_MULE_COMPOSITION_CHAR (buf); \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2220 if (i < 2) \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2221 goto invalid_code; \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2222 ADD_COMPOSITION_DATA (charbuf, i, method); \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2223 for (j = 0; j < i; j++) \
ec0a46fadd7e (DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION): Fix
Kenichi Handa <handa@m17n.org>
parents: 90359
diff changeset
2224 *charbuf++ = components[j]; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2225 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2226
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2227
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2228 #define DECODE_EMACS_MULE_20_RULEBASE_COMPOSITION(c) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2229 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2230 /* Emacs 20 style format for rule-base composition. */ \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2231 /* Store multibyte form of characters to be composed. */ \
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2232 enum composition_method method = COMPOSITION_WITH_RULE; \
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2233 int *charbuf_base = charbuf; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2234 int components[MAX_COMPOSITION_COMPONENTS * 2 - 1]; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2235 int *buf = components; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2236 int i, j; \
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2237 \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2238 DECODE_EMACS_MULE_COMPOSITION_CHAR (buf); \
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2239 for (i = 1; i < MAX_COMPOSITION_COMPONENTS; i++) \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2240 { \
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2241 if (*src < 0xA0) \
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2242 break; \
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2243 DECODE_EMACS_MULE_COMPOSITION_RULE_20 (buf); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2244 DECODE_EMACS_MULE_COMPOSITION_CHAR (buf); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2245 } \
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2246 if (i <= 1 || (buf - components) % 2 == 0) \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2247 goto invalid_code; \
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2248 if (charbuf + i + (i / 2) + 1 >= charbuf_end) \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2249 goto no_more_source; \
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2250 ADD_COMPOSITION_DATA (charbuf, i, method); \
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2251 i = i * 2 - 1; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2252 for (j = 0; j < i; j++) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2253 *charbuf++ = components[j]; \
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2254 charbuf_base[0] -= i; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2255 for (j = 0; j < i; j += 2) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2256 *charbuf++ = components[j]; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2257 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2258
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2259
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2260 static void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2261 decode_coding_emacs_mule (coding)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2262 struct coding_system *coding;
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2263 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2264 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2265 const unsigned char *src_end = coding->source + coding->src_bytes;
59168
0345f2b10f1d (decode_coding_XXX, decode_composition_emacs_mule)
Dan Nicolaescu <dann@ics.uci.edu>
parents: 59095
diff changeset
2266 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
2267 int *charbuf = coding->charbuf + coding->charbuf_used;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
2268 int *charbuf_end
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
2269 = coding->charbuf + coding->charbuf_size - MAX_ANNOTATION_LENGTH;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2270 int consumed_chars = 0, consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2271 int multibytep = coding->src_multibyte;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
2272 Lisp_Object attrs, charset_list;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2273 int char_offset = coding->produced_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2274 int last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2275 int last_id = charset_ascii;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2276 int eol_crlf = EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2277 int byte_after_cr = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2278
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
2279 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2280
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2281 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2282 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2283 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2284
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2285 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2286 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2287
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2288 if (charbuf >= charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2289 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2290
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2291 if (byte_after_cr >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2292 c = byte_after_cr, byte_after_cr = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2293 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2294 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2295 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2296 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2297 *charbuf++ = -c;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2298 char_offset++;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2299 }
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2300 else if (c < 0x80)
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2301 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2302 if (eol_crlf && c == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2303 ONE_MORE_BYTE (byte_after_cr);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2304 *charbuf++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2305 char_offset++;
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2306 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2307 else if (c == 0x80)
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2308 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2309 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2310 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2311 goto invalid_code;
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2312 if (c - 0xF2 >= COMPOSITION_RELATIVE
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2313 && c - 0xF2 <= COMPOSITION_WITH_RULE_ALTCHARS)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2314 DECODE_EMACS_MULE_21_COMPOSITION (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2315 else if (c < 0xC0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2316 DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2317 else if (c == 0xFF)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2318 DECODE_EMACS_MULE_20_RULEBASE_COMPOSITION (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2319 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2320 goto invalid_code;
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2321 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2322 else if (c < 0xA0 && emacs_mule_bytes[c] > 1)
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2323 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2324 int nbytes, nchars;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2325 int id;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2326
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2327 src = src_base;
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2328 consumed_chars = consumed_chars_base;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2329 c = emacs_mule_char (coding, src, &nbytes, &nchars, &id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2330 if (c < 0)
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2331 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2332 if (c == -2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2333 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2334 goto invalid_code;
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2335 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2336 if (last_id != id)
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2337 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2338 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
2339 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2340 last_id = id;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2341 last_offset = char_offset;
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2342 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2343 *charbuf++ = c;
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2344 src += nbytes;
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2345 consumed_chars += nchars;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2346 char_offset++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2347 }
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2348 else
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2349 goto invalid_code;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2350 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2351
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2352 invalid_code:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2353 src = src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2354 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2355 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2356 *charbuf++ = ASCII_BYTE_P (c) ? c : BYTE8_TO_CHAR (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2357 char_offset++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2358 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2359 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2360
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2361 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2362 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
2363 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2364 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2365 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2366 coding->charbuf_used = charbuf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2367 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2368
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2369
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Store in CODES (an array of at least two bytes) the leading code(s)
   for the emacs-mule charset id ID.

   If ID is less than 0xA0, CODES[0] is ID itself and CODES[1] is 0,
   which callers treat as "no second leading code".  Otherwise
   CODES[0] is 0x9A, 0x9B, 0x9C or 0x9D, selected by the range ID
   falls in (below 0xE0, below 0xF0, below 0xF5, anything else), and
   CODES[1] is ID.

   Both arguments are evaluated more than once, so they must not have
   side effects.  The expansion deliberately does NOT end with a
   semicolon: the caller supplies it, which keeps the macro usable as
   the sole statement of an `if' that has an `else'.  */
#define EMACS_MULE_LEADING_CODES(id, codes)		\
  do {							\
    if ((id) < 0xA0)					\
      (codes)[0] = (id), (codes)[1] = 0;		\
    else if ((id) < 0xE0)				\
      (codes)[0] = 0x9A, (codes)[1] = (id);		\
    else if ((id) < 0xF0)				\
      (codes)[0] = 0x9B, (codes)[1] = (id);		\
    else if ((id) < 0xF5)				\
      (codes)[0] = 0x9C, (codes)[1] = (id);		\
    else						\
      (codes)[0] = 0x9D, (codes)[1] = (id);		\
  } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2383
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2384
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Encode the elements of CODING->charbuf (CODING->charbuf_used of
   them) and append the resulting bytes to CODING->destination,
   starting at offset CODING->produced.

   Non-negative elements are characters.  A negative element starts
   an annotation, which is consumed here and never emitted; a charset
   annotation only selects the charset preferred for the characters
   that follow.

   On completion the conversion result is recorded as
   CODING_RESULT_SUCCESS, CODING->produced_char is advanced by the
   local produced_chars counter, and CODING->produced is set to the
   new end offset of the destination.  Always returns 0.

   NOTE(review): ASSURE_DESTINATION, EMIT_ONE_BYTE and
   EMIT_ONE_ASCII_BYTE are defined elsewhere; they presumably refer to
   the locals `dst', `dst_end', `produced_chars', `multibytep',
   `charbuf' and `charbuf_end' by name, so those names should not be
   changed without checking the macro definitions.  */
static int
encode_coding_emacs_mule (coding)
     struct coding_system *coding;
{
  int multibytep = coding->dst_multibyte;
  int *charbuf = coding->charbuf;
  int *charbuf_end = charbuf + coding->charbuf_used;
  unsigned char *dst = coding->destination + coding->produced;
  unsigned char *dst_end = coding->destination + coding->dst_bytes;
  /* Passed to ASSURE_DESTINATION before each element is handled;
     presumably the number of free destination bytes to guarantee.  */
  int safe_room = 8;
  int produced_chars = 0;
  Lisp_Object attrs, charset_list;
  int c;
  /* Charset id requested by the most recent charset annotation, or -1
     when there is none (or it is not a member of charset_list).  */
  int preferred_charset_id = -1;

  CODING_GET_INFO (coding, attrs, charset_list);
  /* Resync the coding system's charset list with the current value of
     Vemacs_mule_charset_list if the two are no longer the same object.  */
  if (! EQ (charset_list, Vemacs_mule_charset_list))
    {
      CODING_ATTR_CHARSET_LIST (attrs)
	= charset_list = Vemacs_mule_charset_list;
    }

  while (charbuf < charbuf_end)
    {
      ASSURE_DESTINATION (safe_room);
      c = *charbuf++;

      if (c < 0)
	{
	  /* Handle an annotation. */
	  switch (*charbuf)
	    {
	    case CODING_ANNOTATE_COMPOSITION_MASK:
	      /* Not yet implemented. */
	      break;
	    case CODING_ANNOTATE_CHARSET_MASK:
	      /* NOTE(review): charbuf already points one element past
		 the negative header here, so this index is relative to
		 the annotation's second element -- confirm it matches
		 the layout written by ADD_CHARSET_DATA.  */
	      preferred_charset_id = charbuf[3];
	      /* Ignore a preferred charset that is not in charset_list.  */
	      if (preferred_charset_id >= 0
		  && NILP (Fmemq (make_number (preferred_charset_id),
				  charset_list)))
		preferred_charset_id = -1;
	      break;
	    default:
	      abort ();
	    }
	  /* Skip the remaining elements of the annotation; -c is
	     apparently its total length including the header element
	     that was already consumed above.  */
	  charbuf += -c - 1;
	  continue;
	}

      if (ASCII_CHAR_P (c))
	EMIT_ONE_ASCII_BYTE (c);
      else if (CHAR_BYTE8_P (c))
	{
	  /* Raw 8-bit character: emit the byte it stands for.  */
	  c = CHAR_TO_BYTE8 (c);
	  EMIT_ONE_BYTE (c);
	}
      else
	{
	  struct charset *charset;
	  unsigned code;
	  int dimension;
	  int emacs_mule_id;
	  unsigned char leading_codes[2];

	  /* Try the preferred charset first; otherwise (or if it does
	     not contain C) look C up in charset_list.  Every path that
	     yields a non-null charset also sets `code'.  */
	  if (preferred_charset_id >= 0)
	    {
	      charset = CHARSET_FROM_ID (preferred_charset_id);
	      if (CHAR_CHARSET_P (c, charset))
		code = ENCODE_CHAR (charset, c);
	      else
		charset = char_charset (c, charset_list, &code);
	    }
	  else
	    charset = char_charset (c, charset_list, &code);
	  if (! charset)
	    {
	      /* No charset found for C: substitute the coding system's
		 default character.  */
	      c = coding->default_char;
	      if (ASCII_CHAR_P (c))
		{
		  EMIT_ONE_ASCII_BYTE (c);
		  continue;
		}
	      /* NOTE(review): the result of this second lookup is not
		 checked before `charset' is used below -- confirm that
		 default_char is always covered by charset_list.  */
	      charset = char_charset (c, charset_list, &code);
	    }
	  dimension = CHARSET_DIMENSION (charset);
	  emacs_mule_id = CHARSET_EMACS_MULE_ID (charset);
	  /* Emit one or two leading codes (the second only if nonzero),
	     then the code point with 0x80 set in each byte: one byte
	     for a dimension-1 charset, two bytes otherwise.  */
	  EMACS_MULE_LEADING_CODES (emacs_mule_id, leading_codes);
	  EMIT_ONE_BYTE (leading_codes[0]);
	  if (leading_codes[1])
	    EMIT_ONE_BYTE (leading_codes[1]);
	  if (dimension == 1)
	    EMIT_ONE_BYTE (code | 0x80);
	  else
	    {
	      code |= 0x8080;
	      EMIT_ONE_BYTE (code >> 8);
	      EMIT_ONE_BYTE (code & 0xFF);
	    }
	}
    }
  record_conversion_result (coding, CODING_RESULT_SUCCESS);
  coding->produced_char += produced_chars;
  coding->produced = dst - coding->destination;
  return 0;
}
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2490
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2491
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2492 /*** 7. ISO2022 handlers ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2493
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2494 /* The following note describes the coding system ISO2022 briefly.
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2495 Since the intention of this note is to help understand the
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2496 functions in this file, some parts are NOT ACCURATE or are OVERLY
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2497 SIMPLIFIED. For thorough understanding, please refer to the
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2498 original document of ISO2022. This is equivalent to the standard
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2499 ECMA-35, obtainable from <URL:http://www.ecma.ch/> (*).
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2500
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2501 ISO2022 provides many mechanisms to encode several character sets
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2502 in 7-bit and 8-bit environments. For 7-bit environments, all text
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2503 is encoded using bytes less than 128. This may make the encoded
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2504 text a little bit longer, but the text passes more easily through
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2505 several types of gateway, some of which strip off the MSB (Most
36087
05ef3feab39b Doc and message fixes.
Dave Love <fx@gnu.org>
parents: 35995
diff changeset
2506 Significant Bit).
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2507
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2508 There are two kinds of character sets: control character sets and
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2509 graphic character sets. The former contain control characters such
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2510 as `newline' and `escape' to provide control functions (control
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2511 functions are also provided by escape sequences). The latter
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2512 contain graphic characters such as 'A' and '-'. Emacs recognizes
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2513 two control character sets and many graphic character sets.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2514
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2515 Graphic character sets are classified into one of the following
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2516 four classes, according to the number of bytes (DIMENSION) and
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2517 number of characters in one dimension (CHARS) of the set:
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2518 - DIMENSION1_CHARS94
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2519 - DIMENSION1_CHARS96
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2520 - DIMENSION2_CHARS94
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2521 - DIMENSION2_CHARS96
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2522
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2523 In addition, each character set is assigned an identification tag,
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2524 unique for each set, called the "final character" (denoted as <F>
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2525 hereafter). The <F> of each character set is decided by ECMA(*)
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2526 when it is registered in ISO. The code range of <F> is 0x30..0x7F
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2527 (0x30..0x3F are for private use only).
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2528
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2529 Note (*): ECMA = European Computer Manufacturers Association
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2530
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2531 Here are examples of graphic character sets [NAME(<F>)]:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2532 o DIMENSION1_CHARS94 -- ASCII('B'), right-half-of-JISX0201('I'), ...
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2533 o DIMENSION1_CHARS96 -- right-half-of-ISO8859-1('A'), ...
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2534 o DIMENSION2_CHARS94 -- GB2312('A'), JISX0208('B'), ...
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2535 o DIMENSION2_CHARS96 -- none for the moment
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2536
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2537 A code area (1 byte=8 bits) is divided into 4 areas, C0, GL, C1, and GR.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2538 C0 [0x00..0x1F] -- control character plane 0
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2539 GL [0x20..0x7F] -- graphic character plane 0
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2540 C1 [0x80..0x9F] -- control character plane 1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2541 GR [0xA0..0xFF] -- graphic character plane 1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2542
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2543 A control character set is directly designated and invoked to C0 or
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2544 C1 by an escape sequence. The most common case is that:
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2545 - ISO646's control character set is designated/invoked to C0, and
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2546 - ISO6429's control character set is designated/invoked to C1,
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2547 and usually these designations/invocations are omitted in encoded
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2548 text. In a 7-bit environment, only C0 can be used, and a control
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2549 character for C1 is encoded by an appropriate escape sequence to
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2550 fit into the environment. All control characters for C1 are
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2551 defined to have corresponding escape sequences.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2552
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2553 A graphic character set is at first designated to one of four
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2554 graphic registers (G0 through G3), then these graphic registers are
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2555 invoked to GL or GR. These designations and invocations can be
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2556 done independently. The most common case is that G0 is invoked to
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2557 GL, G1 is invoked to GR, and ASCII is designated to G0. Usually
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2558 these invocations and designations are omitted in encoded text.
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2559 In a 7-bit environment, only GL can be used.
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2560
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2561 When a graphic character set of CHARS94 is invoked to GL, codes
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2562 0x20 and 0x7F of the GL area work as control characters SPACE and
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2563 DEL respectively, and codes 0xA0 and 0xFF of the GR area should not
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2564 be used.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2565
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2566 There are two ways of invocation: locking-shift and single-shift.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2567 With locking-shift, the invocation lasts until the next different
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2568 invocation, whereas with single-shift, the invocation affects the
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2569 following character only and doesn't affect the locking-shift
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2570 state. Invocations are done by the following control characters or
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2571 escape sequences:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2572
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2573 ----------------------------------------------------------------------
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2574 abbrev function cntrl escape seq description
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2575 ----------------------------------------------------------------------
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2576 SI/LS0 (shift-in) 0x0F none invoke G0 into GL
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2577 SO/LS1 (shift-out) 0x0E none invoke G1 into GL
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2578 LS2 (locking-shift-2) none ESC 'n' invoke G2 into GL
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2579 LS3 (locking-shift-3) none ESC 'o' invoke G3 into GL
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2580 LS1R (locking-shift-1 right) none ESC '~' invoke G1 into GR (*)
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2581 LS2R (locking-shift-2 right) none ESC '}' invoke G2 into GR (*)
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2582 LS3R (locking-shift-3 right) none ESC '|' invoke G3 into GR (*)
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2583 SS2 (single-shift-2) 0x8E ESC 'N' invoke G2 for one char
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2584 SS3 (single-shift-3) 0x8F ESC 'O' invoke G3 for one char
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2585 ----------------------------------------------------------------------
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2586 (*) These are not used by any known coding system.
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2587
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2588 Control characters for these functions are defined by macros
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2589 ISO_CODE_XXX in `coding.h'.
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2590
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2591 Designations are done by the following escape sequences:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2592 ----------------------------------------------------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2593 escape sequence description
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2594 ----------------------------------------------------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2595 ESC '(' <F> designate DIMENSION1_CHARS94<F> to G0
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2596 ESC ')' <F> designate DIMENSION1_CHARS94<F> to G1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2597 ESC '*' <F> designate DIMENSION1_CHARS94<F> to G2
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2598 ESC '+' <F> designate DIMENSION1_CHARS94<F> to G3
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2599 ESC ',' <F> designate DIMENSION1_CHARS96<F> to G0 (*)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2600 ESC '-' <F> designate DIMENSION1_CHARS96<F> to G1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2601 ESC '.' <F> designate DIMENSION1_CHARS96<F> to G2
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2602 ESC '/' <F> designate DIMENSION1_CHARS96<F> to G3
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2603 ESC '$' '(' <F> designate DIMENSION2_CHARS94<F> to G0 (**)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2604 ESC '$' ')' <F> designate DIMENSION2_CHARS94<F> to G1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2605 ESC '$' '*' <F> designate DIMENSION2_CHARS94<F> to G2
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2606 ESC '$' '+' <F> designate DIMENSION2_CHARS94<F> to G3
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2607 ESC '$' ',' <F> designate DIMENSION2_CHARS96<F> to G0 (*)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2608 ESC '$' '-' <F> designate DIMENSION2_CHARS96<F> to G1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2609 ESC '$' '.' <F> designate DIMENSION2_CHARS96<F> to G2
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2610 ESC '$' '/' <F> designate DIMENSION2_CHARS96<F> to G3
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2611 ----------------------------------------------------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2612
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2613 In this list, "DIMENSION1_CHARS94<F>" means a graphic character set
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2614 of dimension 1, chars 94, and final character <F>, etc...
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2615
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2616 Note (*): Although these designations are not allowed in ISO2022,
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2617 Emacs accepts them on decoding, and produces them on encoding
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2618 CHARS96 character sets in a coding system which is characterized as
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2619 7-bit environment, non-locking-shift, and non-single-shift.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2620
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2621 Note (**): If <F> is '@', 'A', or 'B', the intermediate character
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2622 '(' must be omitted. We refer to this as "short-form" hereafter.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2623
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2624 Now you may notice that there are a lot of ways of encoding the
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2625 same multilingual text in ISO2022. Actually, there exist many
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2626 coding systems such as Compound Text (used in X11's inter client
36087
05ef3feab39b Doc and message fixes.
Dave Love <fx@gnu.org>
parents: 35995
diff changeset
2627 communication), ISO-2022-JP (used in Japanese Internet), ISO-2022-KR
05ef3feab39b Doc and message fixes.
Dave Love <fx@gnu.org>
parents: 35995
diff changeset
2628 (used in Korean Internet), EUC (Extended UNIX Code, used in Asian
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2629 localized platforms), and all of these are variants of ISO2022.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2630
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2631 In addition to the above, Emacs handles two more kinds of escape
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2632 sequences: ISO6429's direction specification and Emacs' private
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2633 sequence for specifying character composition.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2634
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2635 ISO6429's direction specification takes the following form:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2636 o CSI ']' -- end of the current direction
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2637 o CSI '0' ']' -- end of the current direction
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2638 o CSI '1' ']' -- start of left-to-right text
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2639 o CSI '2' ']' -- start of right-to-left text
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2640 The control character CSI (0x9B: control sequence introducer) is
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2641 abbreviated to the escape sequence ESC '[' in a 7-bit environment.
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2642
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2643 Character composition specification takes the following form:
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2644 o ESC '0' -- start relative composition
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2645 o ESC '1' -- end composition
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2646 o ESC '2' -- start rule-base composition (*)
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2647 o ESC '3' -- start relative composition with alternate chars (**)
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2648 o ESC '4' -- start rule-base composition with alternate chars (**)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2649 Since these are not standard escape sequences of any ISO standard,
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2650 the use of them with these meanings is restricted to Emacs only.
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2651
88771
75c78754826d comments
Dave Love <fx@gnu.org>
parents: 88690
diff changeset
2652 (*) This form is used only in Emacs 20.7 and older versions,
75c78754826d comments
Dave Love <fx@gnu.org>
parents: 88690
diff changeset
2653 but newer versions can safely decode it.
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2654 (**) This form is used only in Emacs 21.1 and newer versions,
88771
75c78754826d comments
Dave Love <fx@gnu.org>
parents: 88690
diff changeset
2655 and older versions can't decode it.
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2656
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2657 Here's a list of example usages of these composition escape
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2658 sequences (categorized by `enum composition_method').
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2659
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2660 COMPOSITION_RELATIVE:
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2661 ESC 0 CHAR [ CHAR ] ESC 1
36087
05ef3feab39b Doc and message fixes.
Dave Love <fx@gnu.org>
parents: 35995
diff changeset
2662 COMPOSITION_WITH_RULE:
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2663 ESC 2 CHAR [ RULE CHAR ] ESC 1
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2664 COMPOSITION_WITH_ALTCHARS:
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2665 ESC 3 ALTCHAR [ ALTCHAR ] ESC 0 CHAR [ CHAR ] ESC 1
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2666 COMPOSITION_WITH_RULE_ALTCHARS:
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2667 ESC 4 ALTCHAR [ RULE ALTCHAR ] ESC 0 CHAR [ CHAR ] ESC 1 */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2668
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2669 enum iso_code_class_type iso_code_class[256];
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2670
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2671 #define SAFE_CHARSET_P(coding, id) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2672 ((id) <= (coding)->max_charset_id \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2673 && (coding)->safe_charsets[id] >= 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2674
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2675
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2676 #define SHIFT_OUT_OK(category) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2677 (CODING_ISO_INITIAL (&coding_categories[category], 1) >= 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2678
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2679 static void
88631
780b91d4a7e5 (setup_iso_safe_charsets): Fix arg decl for K&R.
Dave Love <fx@gnu.org>
parents: 88607
diff changeset
2680 setup_iso_safe_charsets (attrs)
780b91d4a7e5 (setup_iso_safe_charsets): Fix arg decl for K&R.
Dave Love <fx@gnu.org>
parents: 88607
diff changeset
2681 Lisp_Object attrs;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2682 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2683 Lisp_Object charset_list, safe_charsets;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2684 Lisp_Object request;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2685 Lisp_Object reg_usage;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2686 Lisp_Object tail;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2687 int reg94, reg96;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2688 int flags = XINT (AREF (attrs, coding_attr_iso_flags));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2689 int max_charset_id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2690
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2691 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2692 if ((flags & CODING_ISO_FLAG_FULL_SUPPORT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2693 && ! EQ (charset_list, Viso_2022_charset_list))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2694 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2695 CODING_ATTR_CHARSET_LIST (attrs)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2696 = charset_list = Viso_2022_charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2697 ASET (attrs, coding_attr_safe_charsets, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2698 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2699
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2700 if (STRINGP (AREF (attrs, coding_attr_safe_charsets)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2701 return;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2702
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2703 max_charset_id = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2704 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2705 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2706 int id = XINT (XCAR (tail));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2707 if (max_charset_id < id)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2708 max_charset_id = id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2709 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2710
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2711 safe_charsets = Fmake_string (make_number (max_charset_id + 1),
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2712 make_number (255));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2713 request = AREF (attrs, coding_attr_iso_request);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2714 reg_usage = AREF (attrs, coding_attr_iso_usage);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2715 reg94 = XINT (XCAR (reg_usage));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2716 reg96 = XINT (XCDR (reg_usage));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2717
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2718 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2719 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2720 Lisp_Object id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2721 Lisp_Object reg;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2722 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2723
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2724 id = XCAR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2725 charset = CHARSET_FROM_ID (XINT (id));
88681
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
2726 reg = Fcdr (Fassq (id, request));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2727 if (! NILP (reg))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2728 SSET (safe_charsets, XINT (id), XINT (reg));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2729 else if (charset->iso_chars_96)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2730 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2731 if (reg96 < 4)
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2732 SSET (safe_charsets, XINT (id), reg96);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2733 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2734 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2735 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2736 if (reg94 < 4)
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2737 SSET (safe_charsets, XINT (id), reg94);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2738 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2739 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2740 ASET (attrs, coding_attr_safe_charsets, safe_charsets);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2741 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2742
50047
8e17fbb2ac77 (CODING_ADD_COMPOSITION_COMPONENT): If the number of
Kenichi Handa <handa@m17n.org>
parents: 49600
diff changeset
2743
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2744 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2745 Check if a text is encoded in one of ISO-2022 based coding systems.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2746 If it is, return 1, else return 0. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2747
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
2748 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2749 detect_coding_iso_2022 (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2750 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2751 struct coding_detection_info *detect_info;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2752 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2753 const unsigned char *src = coding->source, *src_base = src;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2754 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2755 int multibytep = coding->src_multibyte;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2756 int single_shifting = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2757 int id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2758 int c, c1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2759 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2760 int i;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2761 int rejected = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2762 int found = 0;
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2763 int composition_count = -1;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2764
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2765 detect_info->checked |= CATEGORY_MASK_ISO;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2766
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2767 for (i = coding_category_iso_7; i <= coding_category_iso_8_else; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2768 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2769 struct coding_system *this = &(coding_categories[i]);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2770 Lisp_Object attrs, val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2771
94944
c16046e21b90 (detect_coding_iso_2022): Ignore a coding category that
Kenichi Handa <handa@m17n.org>
parents: 93877
diff changeset
2772 if (this->id < 0)
c16046e21b90 (detect_coding_iso_2022): Ignore a coding category that
Kenichi Handa <handa@m17n.org>
parents: 93877
diff changeset
2773 continue;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2774 attrs = CODING_ID_ATTRS (this->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2775 if (CODING_ISO_FLAGS (this) & CODING_ISO_FLAG_FULL_SUPPORT
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2776 && ! EQ (CODING_ATTR_SAFE_CHARSETS (attrs), Viso_2022_charset_list))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2777 setup_iso_safe_charsets (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2778 val = CODING_ATTR_SAFE_CHARSETS (attrs);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2779 this->max_charset_id = SCHARS (val) - 1;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2780 this->safe_charsets = (char *) SDATA (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2781 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2782
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2783 /* A coding system of this category is always ASCII compatible. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2784 src += coding->head_ascii;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2785
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2786 while (rejected != CATEGORY_MASK_ISO)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2787 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2788 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2789 ONE_MORE_BYTE (c);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2790 switch (c)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2791 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2792 case ISO_CODE_ESC:
30204
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
2793 if (inhibit_iso_escape_detection)
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
2794 break;
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
2795 single_shifting = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2796 ONE_MORE_BYTE (c);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2797 if (c >= '(' && c <= '/')
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
2798 {
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
2799 /* Designation sequence for a charset of dimension 1. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2800 ONE_MORE_BYTE (c1);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2801 if (c1 < ' ' || c1 >= 0x80
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2802 || (id = iso_charset_table[0][c >= ','][c1]) < 0)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2803 /* Invalid designation sequence. Just ignore it. */
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2804 break;
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
2805 }
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
2806 else if (c == '$')
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2807 {
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
2808 /* Designation sequence for a charset of dimension 2. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2809 ONE_MORE_BYTE (c);
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
2810 if (c >= '@' && c <= 'B')
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
2811 /* Designation for JISX0208.1978, GB2312, or JISX0208. */
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2812 id = iso_charset_table[1][0][c];
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
2813 else if (c >= '(' && c <= '/')
17320
9d15bec5f47e (detect_coding_iso2022, detect_coding_mask): Ignore
Kenichi Handa <handa@m17n.org>
parents: 17304
diff changeset
2814 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2815 ONE_MORE_BYTE (c1);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2816 if (c1 < ' ' || c1 >= 0x80
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2817 || (id = iso_charset_table[1][c >= ','][c1]) < 0)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2818 /* Invalid designation sequence. Just ignore it. */
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2819 break;
17320
9d15bec5f47e (detect_coding_iso2022, detect_coding_mask): Ignore
Kenichi Handa <handa@m17n.org>
parents: 17304
diff changeset
2820 }
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
2821 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2822 /* Invalid designation sequence. Just ignore it. */
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2823 break;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2824 }
23116
6736da064f4a (detect_coding_iso2022): Handle ESC N and ESC O
Kenichi Handa <handa@m17n.org>
parents: 23089
diff changeset
2825 else if (c == 'N' || c == 'O')
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2826 {
23116
6736da064f4a (detect_coding_iso2022): Handle ESC N and ESC O
Kenichi Handa <handa@m17n.org>
parents: 23089
diff changeset
2827 /* ESC <Fe> for SS2 or SS3. */
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2828 single_shifting = 1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2829 rejected |= CATEGORY_MASK_ISO_7BIT | CATEGORY_MASK_ISO_8BIT;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2830 break;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2831 }
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2832 else if (c == '1')
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2833 {
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2834 /* End of composition. */
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2835 if (composition_count < 0
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2836 || composition_count > MAX_COMPOSITION_COMPONENTS)
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2837 /* Invalid */
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2838 break;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2839 composition_count = -1;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2840 found |= CATEGORY_MASK_ISO;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2841 }
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2842 else if (c >= '0' && c <= '4')
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2843 {
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2844 /* ESC <Fp> for start/end composition. */
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2845 composition_count = 0;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2846 break;
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2847 }
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
2848 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2849 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2850 /* Invalid escape sequence. Just ignore it. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2851 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2852 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2853
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2854 /* We found a valid designation sequence for CHARSET. */
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2855 rejected |= CATEGORY_MASK_ISO_8BIT;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2856 if (SAFE_CHARSET_P (&coding_categories[coding_category_iso_7],
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2857 id))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2858 found |= CATEGORY_MASK_ISO_7;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2859 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2860 rejected |= CATEGORY_MASK_ISO_7;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2861 if (SAFE_CHARSET_P (&coding_categories[coding_category_iso_7_tight],
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2862 id))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2863 found |= CATEGORY_MASK_ISO_7_TIGHT;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2864 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2865 rejected |= CATEGORY_MASK_ISO_7_TIGHT;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2866 if (SAFE_CHARSET_P (&coding_categories[coding_category_iso_7_else],
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2867 id))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2868 found |= CATEGORY_MASK_ISO_7_ELSE;
23116
6736da064f4a (detect_coding_iso2022): Handle ESC N and ESC O
Kenichi Handa <handa@m17n.org>
parents: 23089
diff changeset
2869 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2870 rejected |= CATEGORY_MASK_ISO_7_ELSE;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2871 if (SAFE_CHARSET_P (&coding_categories[coding_category_iso_8_else],
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2872 id))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2873 found |= CATEGORY_MASK_ISO_8_ELSE;
23116
6736da064f4a (detect_coding_iso2022): Handle ESC N and ESC O
Kenichi Handa <handa@m17n.org>
parents: 23089
diff changeset
2874 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2875 rejected |= CATEGORY_MASK_ISO_8_ELSE;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2876 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2877
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2878 case ISO_CODE_SO:
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2879 case ISO_CODE_SI:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2880 /* Locking shift out/in. */
30204
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
2881 if (inhibit_iso_escape_detection)
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
2882 break;
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
2883 single_shifting = 0;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2884 rejected |= CATEGORY_MASK_ISO_7BIT | CATEGORY_MASK_ISO_8BIT;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2885 break;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
2886
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2887 case ISO_CODE_CSI:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2888 /* Control sequence introducer. */
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
2889 single_shifting = 0;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2890 rejected |= CATEGORY_MASK_ISO_7BIT | CATEGORY_MASK_ISO_7_ELSE;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2891 found |= CATEGORY_MASK_ISO_8_ELSE;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2892 goto check_extra_latin;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2893
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2894 case ISO_CODE_SS2:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2895 case ISO_CODE_SS3:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2896 /* Single shift. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2897 if (inhibit_iso_escape_detection)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2898 break;
89780
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
2899 single_shifting = 0;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2900 rejected |= CATEGORY_MASK_ISO_7BIT;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2901 if (CODING_ISO_FLAGS (&coding_categories[coding_category_iso_8_1])
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2902 & CODING_ISO_FLAG_SINGLE_SHIFT)
89780
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
2903 found |= CATEGORY_MASK_ISO_8_1, single_shifting = 1;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2904 if (CODING_ISO_FLAGS (&coding_categories[coding_category_iso_8_2])
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2905 & CODING_ISO_FLAG_SINGLE_SHIFT)
89780
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
2906 found |= CATEGORY_MASK_ISO_8_2, single_shifting = 1;
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
2907 if (single_shifting)
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
2908 break;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2909 goto check_extra_latin;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2910
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2911 default:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2912 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2913 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2914 if (c < 0x80)
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
2915 {
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2916 if (composition_count >= 0)
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2917 composition_count++;
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
2918 single_shifting = 0;
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
2919 break;
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
2920 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2921 if (c >= 0xA0)
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
2922 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2923 rejected |= CATEGORY_MASK_ISO_7BIT | CATEGORY_MASK_ISO_7_ELSE;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2924 found |= CATEGORY_MASK_ISO_8_1;
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
2925 /* Check the length of succeeding codes of the range
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2926 0xA0..0xFF. If the byte length is even, we include
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2927 CATEGORY_MASK_ISO_8_2 in `found'. We can check this
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2928 only when we are not single shifting. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2929 if (! single_shifting
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2930 && ! (rejected & CATEGORY_MASK_ISO_8_2))
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
2931 {
29299
b33b38d81020 (detect_coding_iso2022): Fix code for checking
Kenichi Handa <handa@m17n.org>
parents: 29275
diff changeset
2932 int i = 1;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2933 while (src < src_end)
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2934 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2935 ONE_MORE_BYTE (c);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2936 if (c < 0xA0)
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2937 break;
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2938 i++;
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2939 }
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2940
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2941 if (i & 1 && src < src_end)
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2942 {
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2943 rejected |= CATEGORY_MASK_ISO_8_2;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2944 if (composition_count >= 0)
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2945 composition_count += i;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2946 }
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
2947 else
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2948 {
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2949 found |= CATEGORY_MASK_ISO_8_2;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2950 if (composition_count >= 0)
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2951 composition_count += i / 2;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
2952 }
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
2953 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2954 break;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2955 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2956 check_extra_latin:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2957 single_shifting = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2958 if (! VECTORP (Vlatin_extra_code_table)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2959 || NILP (XVECTOR (Vlatin_extra_code_table)->contents[c]))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2960 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2961 rejected = CATEGORY_MASK_ISO;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2962 break;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2963 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2964 if (CODING_ISO_FLAGS (&coding_categories[coding_category_iso_8_1])
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2965 & CODING_ISO_FLAG_LATIN_EXTRA)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2966 found |= CATEGORY_MASK_ISO_8_1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2967 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2968 rejected |= CATEGORY_MASK_ISO_8_1;
89780
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
2969 rejected |= CATEGORY_MASK_ISO_8_2;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2970 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2971 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2972 detect_info->rejected |= CATEGORY_MASK_ISO;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2973 return 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2974
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2975 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2976 detect_info->rejected |= rejected;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2977 detect_info->found |= (found & ~rejected);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2978 return 1;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2979 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2980
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2981
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
2982 /* Set designation state into CODING. Set CHARS_96 to -1 if the
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
2983 escape sequence should be kept. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2984 #define DECODE_DESIGNATION(reg, dim, chars_96, final) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2985 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2986 int id, prev; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2987 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2988 if (final < '0' || final >= 128 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2989 || ((id = ISO_CHARSET_TABLE (dim, chars_96, final)) < 0) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2990 || !SAFE_CHARSET_P (coding, id)) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2991 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2992 CODING_ISO_DESIGNATION (coding, reg) = -2; \
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
2993 chars_96 = -1; \
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
2994 break; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2995 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2996 prev = CODING_ISO_DESIGNATION (coding, reg); \
88681
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
2997 if (id == charset_jisx0201_roman) \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
2998 { \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
2999 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_USE_ROMAN) \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3000 id = charset_ascii; \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3001 } \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3002 else if (id == charset_jisx0208_1978) \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3003 { \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3004 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_USE_OLDJIS) \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3005 id = charset_jisx0208; \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3006 } \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3007 CODING_ISO_DESIGNATION (coding, reg) = id; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3008 /* If there was an invalid designation to REG previously, and this \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3009 designation is ASCII to REG, we should keep this designation \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3010 sequence. */ \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3011 if (prev == -2 && id == charset_ascii) \
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3012 chars_96 = -1; \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3013 } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3014
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3015
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3016 #define MAYBE_FINISH_COMPOSITION() \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3017 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3018 int i; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3019 if (composition_state == COMPOSING_NO) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3020 break; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3021 /* It is assured that we have enough room for producing \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3022 characters stored in the table `components'. */ \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3023 if (charbuf + component_idx > charbuf_end) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3024 goto no_more_source; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3025 composition_state = COMPOSING_NO; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3026 if (method == COMPOSITION_RELATIVE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3027 || method == COMPOSITION_WITH_ALTCHARS) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3028 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3029 for (i = 0; i < component_idx; i++) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3030 *charbuf++ = components[i]; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3031 char_offset += component_idx; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3032 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3033 else \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3034 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3035 for (i = 0; i < component_idx; i += 2) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3036 *charbuf++ = components[i]; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3037 char_offset += (component_idx / 2) + 1; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3038 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3039 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3040
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3041
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
3042 /* Handle composition start sequence ESC 0, ESC 2, ESC 3, or ESC 4.
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
3043 ESC 0 : relative composition : ESC 0 CHAR ... ESC 1
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
3044 ESC 2 : rulebase composition : ESC 2 CHAR RULE CHAR RULE ... CHAR ESC 1
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3045 ESC 3 : altchar composition : ESC 3 CHAR ... ESC 0 CHAR ... ESC 1
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3046 ESC 4 : alt&rule composition : ESC 4 CHAR RULE ... CHAR ESC 0 CHAR ... ESC 1
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
3047 */
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3048
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3049 #define DECODE_COMPOSITION_START(c1) \
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3050 do { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3051 if (c1 == '0' \
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3052 && composition_state == COMPOSING_COMPONENT_RULE) \
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3053 { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3054 component_len = component_idx; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3055 composition_state = COMPOSING_CHAR; \
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3056 } \
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3057 else \
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3058 { \
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3059 const unsigned char *p; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3060 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3061 MAYBE_FINISH_COMPOSITION (); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3062 if (charbuf + MAX_COMPOSITION_COMPONENTS > charbuf_end) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3063 goto no_more_source; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3064 for (p = src; p < src_end - 1; p++) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3065 if (*p == ISO_CODE_ESC && p[1] == '1') \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3066 break; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3067 if (p == src_end - 1) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3068 { \
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3069 if (coding->mode & CODING_MODE_LAST_BLOCK) \
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3070 goto invalid_code; \
90350
60eaefb08cf7 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90346
diff changeset
3071 /* The current composition doesn't end in the current \
60eaefb08cf7 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90346
diff changeset
3072 source. */ \
60eaefb08cf7 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90346
diff changeset
3073 record_conversion_result \
60eaefb08cf7 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90346
diff changeset
3074 (coding, CODING_RESULT_INSUFFICIENT_SRC); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3075 goto no_more_source; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3076 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3077 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3078 /* This is surely the start of a composition. */ \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3079 method = (c1 == '0' ? COMPOSITION_RELATIVE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3080 : c1 == '2' ? COMPOSITION_WITH_RULE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3081 : c1 == '3' ? COMPOSITION_WITH_ALTCHARS \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3082 : COMPOSITION_WITH_RULE_ALTCHARS); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3083 composition_state = (c1 <= '2' ? COMPOSING_CHAR \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3084 : COMPOSING_COMPONENT_CHAR); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3085 component_idx = component_len = 0; \
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3086 } \
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3087 } while (0)
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3088
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3089
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3090 /* Handle composition end sequence ESC 1. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3091
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3092 #define DECODE_COMPOSITION_END() \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3093 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3094 int nchars = (component_len > 0 ? component_idx - component_len \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3095 : method == COMPOSITION_RELATIVE ? component_idx \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3096 : (component_idx + 1) / 2); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3097 int i; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3098 int *saved_charbuf = charbuf; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3099 \
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
3100 ADD_COMPOSITION_DATA (charbuf, nchars, method); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3101 if (method != COMPOSITION_RELATIVE) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3102 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3103 if (component_len == 0) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3104 for (i = 0; i < component_idx; i++) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3105 *charbuf++ = components[i]; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3106 else \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3107 for (i = 0; i < component_len; i++) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3108 *charbuf++ = components[i]; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3109 *saved_charbuf = saved_charbuf - charbuf; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3110 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3111 if (method == COMPOSITION_WITH_RULE) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3112 for (i = 0; i < component_idx; i += 2, char_offset++) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3113 *charbuf++ = components[i]; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3114 else \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3115 for (i = component_len; i < component_idx; i++, char_offset++) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3116 *charbuf++ = components[i]; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3117 coding->annotated = 1; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3118 composition_state = COMPOSING_NO; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3119 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3120
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3121
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3122 /* Decode a composition rule from the byte C1 (and maybe one more byte
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3123 from SRC) and store the encoded composition rule back in C1
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3124 (0 if C1 is out of range). */
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3125
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3126 #define DECODE_COMPOSITION_RULE(c1) \
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3127 do { \
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3128 (c1) -= 32; \
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3129 if (c1 < 81) /* old format (before ver.21) */ \
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3130 { \
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3131 int gref = (c1) / 9; \
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3132 int nref = (c1) % 9; \
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3133 if (gref == 4) gref = 10; \
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3134 if (nref == 4) nref = 10; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3135 c1 = COMPOSITION_ENCODE_RULE (gref, nref); \
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3136 } \
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3137 else if (c1 < 93) /* new format (after ver.21) */ \
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3138 { \
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3139 ONE_MORE_BYTE (c2); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3140 c1 = COMPOSITION_ENCODE_RULE (c1 - 81, c2 - 32); \
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3141 } \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3142 else \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3143 c1 = 0; \
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3144 } while (0)
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3145
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3146
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3147 /* See the above "GENERAL NOTES on `decode_coding_XXX ()' functions". */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3148
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3149 static void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3150 decode_coding_iso_2022 (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3151 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3152 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3153 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3154 const unsigned char *src_end = coding->source + coding->src_bytes;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3155 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
3156 int *charbuf = coding->charbuf + coding->charbuf_used;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3157 int *charbuf_end
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
3158 = coding->charbuf + coding->charbuf_size - 4 - MAX_ANNOTATION_LENGTH;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3159 int consumed_chars = 0, consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3160 int multibytep = coding->src_multibyte;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3161 /* Charsets invoked to graphic plane 0 and 1 respectively. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3162 int charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3163 int charset_id_1 = CODING_ISO_INVOKED_CHARSET (coding, 1);
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3164 int charset_id_2, charset_id_3;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3165 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3166 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3167 /* For handling composition sequence. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3168 #define COMPOSING_NO 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3169 #define COMPOSING_CHAR 1
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3170 #define COMPOSING_RULE 2
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3171 #define COMPOSING_COMPONENT_CHAR 3
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3172 #define COMPOSING_COMPONENT_RULE 4
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3173
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3174 int composition_state = COMPOSING_NO;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3175 enum composition_method method;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3176 int components[MAX_COMPOSITION_COMPONENTS * 2 + 1];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3177 int component_idx;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3178 int component_len;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
3179 Lisp_Object attrs, charset_list;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3180 int char_offset = coding->produced_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3181 int last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3182 int last_id = charset_ascii;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3183 int eol_crlf = EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3184 int byte_after_cr = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3185
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
3186 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3187 setup_iso_safe_charsets (attrs);
90772
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
3188 /* Charset list may have been changed. */
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
3189 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
3190 coding->safe_charsets = (char *) SDATA (CODING_ATTR_SAFE_CHARSETS(attrs));
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3191
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3192 while (1)
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3193 {
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3194 int c1, c2;
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3195
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3196 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3197 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3198
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3199 if (charbuf >= charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3200 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3201
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3202 if (byte_after_cr >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3203 c1 = byte_after_cr, byte_after_cr = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3204 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3205 ONE_MORE_BYTE (c1);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
3206 if (c1 < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
3207 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3208
89279
1fd77c471ee6 (decode_coding_utf_8): When eol_type is Qdos, handle
Kenichi Handa <handa@m17n.org>
parents: 89227
diff changeset
3209 /* We produce at most one character. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3210 switch (iso_code_class [c1])
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3211 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3212 case ISO_0x20_or_0x7F:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3213 if (composition_state != COMPOSING_NO)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3214 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3215 if (composition_state == COMPOSING_RULE
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3216 || composition_state == COMPOSING_COMPONENT_RULE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3217 {
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3218 if (component_idx < MAX_COMPOSITION_COMPONENTS * 2 + 1)
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3219 {
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3220 DECODE_COMPOSITION_RULE (c1);
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3221 components[component_idx++] = c1;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3222 composition_state--;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3223 continue;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3224 }
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3225 /* Too long composition. */
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3226 MAYBE_FINISH_COMPOSITION ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3227 }
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3228 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3229 if (charset_id_0 < 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3230 || ! CHARSET_ISO_CHARS_96 (CHARSET_FROM_ID (charset_id_0)))
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3231 /* This is SPACE or DEL. */
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3232 charset = CHARSET_FROM_ID (charset_ascii);
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3233 else
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3234 charset = CHARSET_FROM_ID (charset_id_0);
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3235 break;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3236
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3237 case ISO_graphic_plane_0:
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3238 if (composition_state != COMPOSING_NO)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3239 {
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3240 if (composition_state == COMPOSING_RULE
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3241 || composition_state == COMPOSING_COMPONENT_RULE)
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3242 {
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3243 if (component_idx < MAX_COMPOSITION_COMPONENTS * 2 + 1)
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3244 {
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3245 DECODE_COMPOSITION_RULE (c1);
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3246 components[component_idx++] = c1;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3247 composition_state--;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3248 continue;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3249 }
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3250 MAYBE_FINISH_COMPOSITION ();
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3251 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3252 }
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3253 if (charset_id_0 < 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3254 charset = CHARSET_FROM_ID (charset_ascii);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3255 else
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3256 charset = CHARSET_FROM_ID (charset_id_0);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3257 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3258
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3259 case ISO_0xA0_or_0xFF:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3260 if (charset_id_1 < 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3261 || ! CHARSET_ISO_CHARS_96 (CHARSET_FROM_ID (charset_id_1))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3262 || CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3263 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3264 /* This is a graphic character, we fall down ... */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3265
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3266 case ISO_graphic_plane_1:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3267 if (charset_id_1 < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3268 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3269 charset = CHARSET_FROM_ID (charset_id_1);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3270 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3271
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3272 case ISO_control_0:
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3273 if (eol_crlf && c1 == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3274 ONE_MORE_BYTE (byte_after_cr);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3275 MAYBE_FINISH_COMPOSITION ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3276 charset = CHARSET_FROM_ID (charset_ascii);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3277 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3278
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3279 case ISO_control_1:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3280 MAYBE_FINISH_COMPOSITION ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3281 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3282
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3283 case ISO_shift_out:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3284 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_LOCKING_SHIFT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3285 || CODING_ISO_DESIGNATION (coding, 1) < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3286 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3287 CODING_ISO_INVOCATION (coding, 0) = 1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3288 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3289 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3290
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3291 case ISO_shift_in:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3292 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_LOCKING_SHIFT))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3293 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3294 CODING_ISO_INVOCATION (coding, 0) = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3295 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3296 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3297
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3298 case ISO_single_shift_2_7:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3299 case ISO_single_shift_2:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3300 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3301 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3302 /* SS2 is handled as an escape sequence of ESC 'N' */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3303 c1 = 'N';
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3304 goto label_escape_sequence;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3305
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3306 case ISO_single_shift_3:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3307 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3308 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3309 /* SS3 is handled as an escape sequence of ESC 'O' */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3310 c1 = 'O';
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3311 goto label_escape_sequence;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3312
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3313 case ISO_control_sequence_introducer:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3314 /* CSI is handled as an escape sequence of ESC '[' ... */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3315 c1 = '[';
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3316 goto label_escape_sequence;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3317
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3318 case ISO_escape:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3319 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3320 label_escape_sequence:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3321 /* Escape sequences handled here are invocation,
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3322 designation, direction specification, and character
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3323 composition specification. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3324 switch (c1)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3325 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3326 case '&': /* revision of following character set */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3327 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3328 if (!(c1 >= '@' && c1 <= '~'))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3329 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3330 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3331 if (c1 != ISO_CODE_ESC)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3332 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3333 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3334 goto label_escape_sequence;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3335
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3336 case '$': /* designation of 2-byte character set */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3337 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_DESIGNATION))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3338 goto invalid_code;
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3339 {
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3340 int reg, chars96;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3341
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3342 ONE_MORE_BYTE (c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3343 if (c1 >= '@' && c1 <= 'B')
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3344 { /* designation of JISX0208.1978, GB2312.1980,
23339
2da87b489590 (check_composing_code): Fix previous change. Now it
Kenichi Handa <handa@m17n.org>
parents: 23325
diff changeset
3345 or JISX0208.1980 */
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3346 reg = 0, chars96 = 0;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3347 }
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3348 else if (c1 >= 0x28 && c1 <= 0x2B)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3349 { /* designation of DIMENSION2_CHARS94 character set */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3350 reg = c1 - 0x28, chars96 = 0;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3351 ONE_MORE_BYTE (c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3352 }
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3353 else if (c1 >= 0x2C && c1 <= 0x2F)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3354 { /* designation of DIMENSION2_CHARS96 character set */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3355 reg = c1 - 0x2C, chars96 = 1;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3356 ONE_MORE_BYTE (c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3357 }
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3358 else
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3359 goto invalid_code;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3360 DECODE_DESIGNATION (reg, 2, chars96, c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3361 /* We must update these variables now. */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3362 if (reg == 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3363 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3364 else if (reg == 1)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3365 charset_id_1 = CODING_ISO_INVOKED_CHARSET (coding, 1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3366 if (chars96 < 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3367 goto invalid_code;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3368 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3369 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3370
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3371 case 'n': /* invocation of locking-shift-2 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3372 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_LOCKING_SHIFT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3373 || CODING_ISO_DESIGNATION (coding, 2) < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3374 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3375 CODING_ISO_INVOCATION (coding, 0) = 2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3376 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3377 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3378
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3379 case 'o': /* invocation of locking-shift-3 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3380 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_LOCKING_SHIFT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3381 || CODING_ISO_DESIGNATION (coding, 3) < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3382 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3383 CODING_ISO_INVOCATION (coding, 0) = 3;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3384 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3385 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3386
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3387 case 'N': /* invocation of single-shift-2 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3388 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3389 || CODING_ISO_DESIGNATION (coding, 2) < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3390 goto invalid_code;
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3391 charset_id_2 = CODING_ISO_DESIGNATION (coding, 2);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3392 if (charset_id_2 < 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3393 charset = CHARSET_FROM_ID (charset_ascii);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3394 else
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3395 charset = CHARSET_FROM_ID (charset_id_2);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3396 ONE_MORE_BYTE (c1);
30578
705b94e152b1 (decode_coding_iso2022): More strict check for handling single
Kenichi Handa <handa@m17n.org>
parents: 30487
diff changeset
3397 if (c1 < 0x20 || (c1 >= 0x80 && c1 < 0xA0))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3398 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3399 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3400
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3401 case 'O': /* invocation of single-shift-3 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3402 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3403 || CODING_ISO_DESIGNATION (coding, 3) < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3404 goto invalid_code;
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3405 charset_id_3 = CODING_ISO_DESIGNATION (coding, 3);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3406 if (charset_id_3 < 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3407 charset = CHARSET_FROM_ID (charset_ascii);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3408 else
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3409 charset = CHARSET_FROM_ID (charset_id_3);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3410 ONE_MORE_BYTE (c1);
30578
705b94e152b1 (decode_coding_iso2022): More strict check for handling single
Kenichi Handa <handa@m17n.org>
parents: 30487
diff changeset
3411 if (c1 < 0x20 || (c1 >= 0x80 && c1 < 0xA0))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3412 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3413 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3414
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3415 case '0': case '2': case '3': case '4': /* start composition */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3416 if (! (coding->common_flags & CODING_ANNOTATE_COMPOSITION_MASK))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3417 goto invalid_code;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3418 DECODE_COMPOSITION_START (c1);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3419 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3420
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3421 case '1': /* end composition */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3422 if (composition_state == COMPOSING_NO)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3423 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3424 DECODE_COMPOSITION_END ();
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3425 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3426
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3427 case '[': /* specification of direction */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3428 if (! CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_DIRECTION)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3429 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3430 /* For the moment, nested direction is not supported.
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3431 So, `coding->mode & CODING_MODE_DIRECTION' zero means
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3432 left-to-right, and nonzero means right-to-left. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3433 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3434 switch (c1)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3435 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3436 case ']': /* end of the current direction */
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3437 coding->mode &= ~CODING_MODE_DIRECTION;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3438
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3439 case '0': /* end of the current direction */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3440 case '1': /* start of left-to-right direction */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3441 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3442 if (c1 == ']')
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3443 coding->mode &= ~CODING_MODE_DIRECTION;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3444 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3445 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3446 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3447
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3448 case '2': /* start of right-to-left direction */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3449 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3450 if (c1 == ']')
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3451 coding->mode |= CODING_MODE_DIRECTION;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3452 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3453 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3454 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3455
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3456 default:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3457 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3458 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3459 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3460
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3461 case '%':
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3462 ONE_MORE_BYTE (c1);
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3463 if (c1 == '/')
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3464 {
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3465 /* CTEXT extended segment:
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3466 ESC % / [0-4] M L --ENCODING-NAME-- \002 --BYTES--
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3467 We keep these bytes as is for the moment.
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3468 They may be decoded by post-read-conversion. */
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3469 int dim, M, L;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3470 int size;
56191
75f56340b4f9 (MAX_ALLOCA): Remove define.
Kim F. Storm <storm@cua.dk>
parents: 56028
diff changeset
3471
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3472 ONE_MORE_BYTE (dim);
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3473 ONE_MORE_BYTE (M);
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3474 ONE_MORE_BYTE (L);
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3475 size = ((M - 128) * 128) + (L - 128);
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3476 if (charbuf + 8 + size > charbuf_end)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3477 goto break_loop;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3478 *charbuf++ = ISO_CODE_ESC;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3479 *charbuf++ = '%';
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3480 *charbuf++ = '/';
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3481 *charbuf++ = dim;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3482 *charbuf++ = BYTE8_TO_CHAR (M);
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3483 *charbuf++ = BYTE8_TO_CHAR (L);
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3484 while (size-- > 0)
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3485 {
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3486 ONE_MORE_BYTE (c1);
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3487 *charbuf++ = ASCII_BYTE_P (c1) ? c1 : BYTE8_TO_CHAR (c1);
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3488 }
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3489 }
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3490 else if (c1 == 'G')
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3491 {
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3492 /* XFree86 extension for embedding UTF-8 in CTEXT:
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3493 ESC % G --UTF-8-BYTES-- ESC % @
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3494 We keep these bytes as is for the moment.
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3495 They may be decoded by post-read-conversion. */
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3496 int *p = charbuf;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3497
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3498 if (p + 6 > charbuf_end)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3499 goto break_loop;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3500 *p++ = ISO_CODE_ESC;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3501 *p++ = '%';
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3502 *p++ = 'G';
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3503 while (p < charbuf_end)
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3504 {
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3505 ONE_MORE_BYTE (c1);
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3506 if (c1 == ISO_CODE_ESC
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3507 && src + 1 < src_end
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3508 && src[0] == '%'
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3509 && src[1] == '@')
53239
82690620d562 (decode_coding_iso2022): Fix for preserving UTF-8
Kenichi Handa <handa@m17n.org>
parents: 53087
diff changeset
3510 {
82690620d562 (decode_coding_iso2022): Fix for preserving UTF-8
Kenichi Handa <handa@m17n.org>
parents: 53087
diff changeset
3511 src += 2;
82690620d562 (decode_coding_iso2022): Fix for preserving UTF-8
Kenichi Handa <handa@m17n.org>
parents: 53087
diff changeset
3512 break;
82690620d562 (decode_coding_iso2022): Fix for preserving UTF-8
Kenichi Handa <handa@m17n.org>
parents: 53087
diff changeset
3513 }
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3514 *p++ = ASCII_BYTE_P (c1) ? c1 : BYTE8_TO_CHAR (c1);
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3515 }
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3516 if (p + 3 > charbuf_end)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3517 goto break_loop;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3518 *p++ = ISO_CODE_ESC;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3519 *p++ = '%';
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3520 *p++ = '@';
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3521 charbuf = p;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3522 }
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3523 else
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3524 goto invalid_code;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3525 continue;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3526 break;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3527
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3528 default:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3529 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_DESIGNATION))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3530 goto invalid_code;
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3531 {
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3532 int reg, chars96;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3533
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3534 if (c1 >= 0x28 && c1 <= 0x2B)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3535 { /* designation of DIMENSION1_CHARS94 character set */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3536 reg = c1 - 0x28, chars96 = 0;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3537 ONE_MORE_BYTE (c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3538 }
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3539 else if (c1 >= 0x2C && c1 <= 0x2F)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3540 { /* designation of DIMENSION1_CHARS96 character set */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3541 reg = c1 - 0x2C, chars96 = 1;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3542 ONE_MORE_BYTE (c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3543 }
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3544 else
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3545 goto invalid_code;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3546 DECODE_DESIGNATION (reg, 1, chars96, c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3547 /* We must update these variables now. */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3548 if (reg == 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3549 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3550 else if (reg == 1)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3551 charset_id_1 = CODING_ISO_INVOKED_CHARSET (coding, 1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3552 if (chars96 < 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3553 goto invalid_code;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3554 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3555 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3556 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3557 }
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3558
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3559 if (charset->id != charset_ascii
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3560 && last_id != charset->id)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3561 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3562 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
3563 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3564 last_id = charset->id;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3565 last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3566 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3567
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3568 /* Now we know CHARSET and 1st position code C1 of a character.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3569 Produce a decoded character while getting 2nd position code
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3570 C2 if necessary. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3571 c1 &= 0x7F;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3572 if (CHARSET_DIMENSION (charset) > 1)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3573 {
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3574 ONE_MORE_BYTE (c2);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3575 if (c2 < 0x20 || (c2 >= 0x80 && c2 < 0xA0))
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3576 /* C2 is not in a valid range. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3577 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3578 c1 = (c1 << 8) | (c2 & 0x7F);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3579 if (CHARSET_DIMENSION (charset) > 2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3580 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3581 ONE_MORE_BYTE (c2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3582 if (c2 < 0x20 || (c2 >= 0x80 && c2 < 0xA0))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3583 /* C2 is not in a valid range. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3584 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3585 c1 = (c1 << 8) | (c2 & 0x7F);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3586 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3587 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3588
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3589 CODING_DECODE_CHAR (coding, src, src_base, src_end, charset, c1, c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3590 if (c < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3591 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3592 MAYBE_FINISH_COMPOSITION ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3593 for (; src_base < src; src_base++, char_offset++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3594 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3595 if (ASCII_BYTE_P (*src_base))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3596 *charbuf++ = *src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3597 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3598 *charbuf++ = BYTE8_TO_CHAR (*src_base);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3599 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3600 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3601 else if (composition_state == COMPOSING_NO)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3602 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3603 *charbuf++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3604 char_offset++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3605 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3606 else
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3607 {
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3608 if (component_idx < MAX_COMPOSITION_COMPONENTS * 2 + 1)
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3609 {
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3610 components[component_idx++] = c;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3611 if (method == COMPOSITION_WITH_RULE
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3612 || (method == COMPOSITION_WITH_RULE_ALTCHARS
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3613 && composition_state == COMPOSING_COMPONENT_CHAR))
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3614 composition_state++;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3615 }
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3616 else
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3617 {
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3618 MAYBE_FINISH_COMPOSITION ();
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3619 *charbuf++ = c;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3620 char_offset++;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3621 }
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3622 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3623 continue;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3624
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3625 invalid_code:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3626 MAYBE_FINISH_COMPOSITION ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3627 src = src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3628 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3629 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
3630 *charbuf++ = c < 0 ? -c : ASCII_BYTE_P (c) ? c : BYTE8_TO_CHAR (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3631 char_offset++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3632 coding->errors++;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3633 continue;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3634
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3635 break_loop:
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3636 break;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3637 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3638
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3639 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3640 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
3641 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3642 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3643 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3644 coding->charbuf_used = charbuf - coding->charbuf;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3645 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3646
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3647
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
3648 /* ISO2022 encoding stuff. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3649
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3650 /*
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
3651 It is not enough to say just "ISO2022" on encoding; we have to
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3652 specify more details. In Emacs, each coding system of ISO2022
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3653 variant has the following specifications:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3654 1. Initial designation to G0 thru G3.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3655 2. Allows short-form designation?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3656 3. ASCII should be designated to G0 before control characters?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3657 4. ASCII should be designated to G0 at end of line?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3658 5. 7-bit environment or 8-bit environment?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3659 6. Use locking-shift?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3660 7. Use single-shift?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3661 And the following two are only for Japanese:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3662 8. Use ASCII in place of JIS0201-1976-Roman?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3663 9. Use JISX0208-1983 in place of JISX0208-1978?
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3664 These specifications are encoded in CODING_ISO_FLAGS (coding) as flag bits
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3665 defined by macros CODING_ISO_FLAG_XXX. See `coding.h' for more
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
3666 details.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3667 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3668
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3669 /* Produce codes (escape sequence) for designating CHARSET to graphic
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3670 register REG at DST, and increment DST. If <final-char> of CHARSET is
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3671 '@', 'A', or 'B' and the coding system CODING allows, produce
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3672 a short-form designation sequence. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3673
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3674 #define ENCODE_DESIGNATION(charset, reg, coding) \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3675 do { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3676 unsigned char final_char = CHARSET_ISO_FINAL (charset); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3677 char *intermediate_char_94 = "()*+"; \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3678 char *intermediate_char_96 = ",-./"; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3679 int revision = -1; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3680 int c; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3681 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3682 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_REVISION) \
88856
13a375bc220d (ENCODE_DESIGNATION, decode_eol)
Dave Love <fx@gnu.org>
parents: 88845
diff changeset
3683 revision = CHARSET_ISO_REVISION (charset); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3684 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3685 if (revision >= 0) \
20150
402b6e5f4b58 (encode_designation_at_bol): Fix bug of finding graphic
Kenichi Handa <handa@m17n.org>
parents: 20105
diff changeset
3686 { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3687 EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, '&'); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3688 EMIT_ONE_BYTE ('@' + revision); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3689 } \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3690 EMIT_ONE_ASCII_BYTE (ISO_CODE_ESC); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3691 if (CHARSET_DIMENSION (charset) == 1) \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3692 { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3693 if (! CHARSET_ISO_CHARS_96 (charset)) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3694 c = intermediate_char_94[reg]; \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3695 else \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3696 c = intermediate_char_96[reg]; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3697 EMIT_ONE_ASCII_BYTE (c); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3698 } \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3699 else \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3700 { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3701 EMIT_ONE_ASCII_BYTE ('$'); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3702 if (! CHARSET_ISO_CHARS_96 (charset)) \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3703 { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3704 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_LONG_FORM \
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3705 || reg != 0 \
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3706 || final_char < '@' || final_char > 'B') \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3707 EMIT_ONE_ASCII_BYTE (intermediate_char_94[reg]); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3708 } \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3709 else \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3710 EMIT_ONE_ASCII_BYTE (intermediate_char_96[reg]); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3711 } \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3712 EMIT_ONE_ASCII_BYTE (final_char); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3713 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3714 CODING_ISO_DESIGNATION (coding, reg) = CHARSET_ID (charset); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3715 } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3716
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3717
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3718 /* The following two macros produce codes (control character or escape
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3719 sequence) for ISO2022 single-shift functions (single-shift-2 and
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3720 single-shift-3). */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3721
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Emit the single-shift-2 function and flag CODING as being in the
   single-shifting state.  A coding system that has
   CODING_ISO_FLAG_SEVEN_BITS set gets the two-byte form ESC 'N'; any
   other coding system gets the lone ISO_CODE_SS2 byte.  The macro
   expands in place, so `coding' (and whatever the EMIT_* macros
   touch) must be visible at the point of use.  */
#define ENCODE_SINGLE_SHIFT_2 \
  do \
    { \
      if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS)) \
        { \
          EMIT_ONE_BYTE (ISO_CODE_SS2); \
        } \
      else \
        { \
          EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, 'N'); \
        } \
      CODING_ISO_SINGLE_SHIFTING (coding) = 1; \
    } \
  while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3730
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3731
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Emit the single-shift-3 function and flag CODING as being in the
   single-shifting state.  A coding system that has
   CODING_ISO_FLAG_SEVEN_BITS set gets the two-byte form ESC 'O'; any
   other coding system gets the lone ISO_CODE_SS3 byte.  The macro
   expands in place, so `coding' (and whatever the EMIT_* macros
   touch) must be visible at the point of use.  */
#define ENCODE_SINGLE_SHIFT_3 \
  do \
    { \
      if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS)) \
        { \
          EMIT_ONE_BYTE (ISO_CODE_SS3); \
        } \
      else \
        { \
          EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, 'O'); \
        } \
      CODING_ISO_SINGLE_SHIFTING (coding) = 1; \
    } \
  while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3740
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3741
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3742 /* The following four macros produce codes (control character or
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3743 escape sequence) for ISO2022 locking-shift functions (shift-in,
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3744 shift-out, locking-shift-2, and locking-shift-3). */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3745
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Shift-in: emit the ISO_CODE_SI control byte, then record in CODING
   that graphic register 0 is the one invoked on graphic plane 0.
   `coding' must be in scope where the macro is expanded.  */
#define ENCODE_SHIFT_IN \
  do \
    { \
      EMIT_ONE_ASCII_BYTE (ISO_CODE_SI); \
      CODING_ISO_INVOCATION (coding, 0) = 0; \
    } \
  while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3751
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3752
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Shift-out: emit the ISO_CODE_SO control byte, then record in CODING
   that graphic register 1 is the one invoked on graphic plane 0.
   `coding' must be in scope where the macro is expanded.  */
#define ENCODE_SHIFT_OUT \
  do \
    { \
      EMIT_ONE_ASCII_BYTE (ISO_CODE_SO); \
      CODING_ISO_INVOCATION (coding, 0) = 1; \
    } \
  while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3758
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3759
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Locking-shift-2: emit the escape sequence ESC 'n', then record in
   CODING that graphic register 2 is the one invoked on graphic
   plane 0.  `coding' must be in scope where the macro is expanded.  */
#define ENCODE_LOCKING_SHIFT_2 \
  do \
    { \
      EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, 'n'); \
      CODING_ISO_INVOCATION (coding, 0) = 2; \
    } \
  while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3765
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3766
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Locking-shift-3: emit the escape sequence ESC 'o', then record in
   CODING that graphic register 3 is the one invoked on graphic
   plane 0.  `coding' must be in scope where the macro is expanded.

   The final byte must be 'o'.  ESC 'n' is locking-shift-2, so
   emitting it here would make a reader invoke register 2 while the
   encoder state recorded below says register 3.  */
#define ENCODE_LOCKING_SHIFT_3 \
  do { \
    EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, 'o'); \
    CODING_ISO_INVOCATION (coding, 0) = 3; \
  } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3772
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3773
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
/* Produce codes for a DIMENSION1 character whose character set is
   CHARSET and whose position-code is C1.  Designation and invocation
   sequences are also produced in advance if necessary.

   CHARSET is evaluated more than once and must be an lvalue: when
   CODING_ISO_FLAG_USE_ROMAN is set and CHARSET is ASCII, it is
   replaced by the charset for charset_jisx0201_roman.  C1 may be any
   integer expression; it is parenthesized wherever it is used.

   The expansion refers to `coding', `dst' and `produced_chars', which
   must be in scope at the point of use.  */

#define ENCODE_ISO_CHARACTER_DIMENSION1(charset, c1) \
  do { \
    int id = CHARSET_ID (charset); \
 \
    if ((CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_USE_ROMAN) \
        && id == charset_ascii) \
      { \
        id = charset_jisx0201_roman; \
        charset = CHARSET_FROM_ID (id); \
      } \
 \
    if (CODING_ISO_SINGLE_SHIFTING (coding)) \
      { \
        /* A single-shift function was just emitted; this byte \
           consumes it, so the state is cleared afterwards.  */ \
        if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS) \
          EMIT_ONE_ASCII_BYTE ((c1) & 0x7F); \
        else \
          EMIT_ONE_BYTE ((c1) | 0x80); \
        CODING_ISO_SINGLE_SHIFTING (coding) = 0; \
        break; \
      } \
    else if (id == CODING_ISO_INVOKED_CHARSET (coding, 0)) \
      { \
        /* Invoked on graphic plane 0: emit with the high bit clear.  */ \
        EMIT_ONE_ASCII_BYTE ((c1) & 0x7F); \
        break; \
      } \
    else if (id == CODING_ISO_INVOKED_CHARSET (coding, 1)) \
      { \
        /* Invoked on graphic plane 1: emit with the high bit set.  */ \
        EMIT_ONE_BYTE ((c1) | 0x80); \
        break; \
      } \
    else \
      /* Since CHARSET is not yet invoked to any graphic planes, we \
         must invoke it, or, at first, designate it to some graphic \
         register.  Then repeat the loop to actually produce the \
         character.  */ \
      dst = encode_invocation_designation (charset, coding, dst, \
                                           &produced_chars); \
  } while (1)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3816
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3817
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Emit the two bytes of a DIMENSION2 character whose character set is
   CHARSET and whose position-codes are C1 and C2, first producing
   whatever designation and invocation codes are still needed.

   CHARSET is evaluated more than once and must be an lvalue: when
   CODING_ISO_FLAG_USE_OLDJIS is set and CHARSET is charset_jisx0208,
   it is replaced by the charset for charset_jisx0208_1978.

   The expansion refers to `coding', `dst' and `produced_chars', which
   must be in scope at the point of use.  */

#define ENCODE_ISO_CHARACTER_DIMENSION2(charset, c1, c2) \
  do \
    { \
      int id = CHARSET_ID (charset); \
 \
      if ((CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_USE_OLDJIS) \
          && id == charset_jisx0208) \
        { \
          id = charset_jisx0208_1978; \
          charset = CHARSET_FROM_ID (id); \
        } \
 \
      /* Each emitting case below leaves the loop, so the cases can \
         be tested one after another.  */ \
      if (CODING_ISO_SINGLE_SHIFTING (coding)) \
        { \
          /* A single-shift function was just emitted; these bytes \
             consume it, so the state is cleared afterwards.  */ \
          if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS)) \
            { \
              EMIT_TWO_BYTES ((c1) | 0x80, (c2) | 0x80); \
            } \
          else \
            { \
              EMIT_TWO_ASCII_BYTES ((c1) & 0x7F, (c2) & 0x7F); \
            } \
          CODING_ISO_SINGLE_SHIFTING (coding) = 0; \
          break; \
        } \
 \
      if (id == CODING_ISO_INVOKED_CHARSET (coding, 0)) \
        { \
          /* Invoked on graphic plane 0: high bits clear.  */ \
          EMIT_TWO_ASCII_BYTES ((c1) & 0x7F, (c2) & 0x7F); \
          break; \
        } \
 \
      if (id == CODING_ISO_INVOKED_CHARSET (coding, 1)) \
        { \
          /* Invoked on graphic plane 1: high bits set.  */ \
          EMIT_TWO_BYTES ((c1) | 0x80, (c2) | 0x80); \
          break; \
        } \
 \
      /* CHARSET is not invoked on either graphic plane yet.  Emit \
         the designation and/or invocation it needs, then go round \
         the loop again to produce the character itself.  */ \
      dst = encode_invocation_designation (charset, coding, dst, \
                                           &produced_chars); \
    } \
  while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3860
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3861
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Encode character C of CHARSET.  The code point obtained from
   ENCODE_CHAR is passed whole to the DIMENSION1 macro when
   CHARSET_DIMENSION is 1; otherwise it is split into its bits above
   bit 7 and its low eight bits for the DIMENSION2 macro.  CHARSET is
   evaluated more than once.  */
#define ENCODE_ISO_CHARACTER(charset, c) \
  do \
    { \
      int code = ENCODE_CHAR ((charset),(c)); \
 \
      if (CHARSET_DIMENSION (charset) != 1) \
        { \
          ENCODE_ISO_CHARACTER_DIMENSION2 ((charset), code >> 8, code & 0xFF); \
        } \
      else \
        { \
          ENCODE_ISO_CHARACTER_DIMENSION1 ((charset), code); \
        } \
    } \
  while (0)
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
3871
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
3872
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3873 /* Produce designation and invocation codes at a place pointed by DST
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3874 to use CHARSET. The element `spec.iso_2022' of *CODING is updated.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3875 Return new DST. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3876
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3877 unsigned char *
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3878 encode_invocation_designation (charset, coding, dst, p_nchars)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3879 struct charset *charset;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3880 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3881 unsigned char *dst;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3882 int *p_nchars;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3883 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3884 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3885 int produced_chars = *p_nchars;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3886 int reg; /* graphic register number */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3887 int id = CHARSET_ID (charset);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3888
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3889 /* At first, check designations. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3890 for (reg = 0; reg < 4; reg++)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3891 if (id == CODING_ISO_DESIGNATION (coding, reg))
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3892 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3893
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3894 if (reg >= 4)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3895 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3896 /* CHARSET is not yet designated to any graphic registers. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3897 /* At first check the requested designation. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3898 reg = CODING_ISO_REQUEST (coding, id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3899 if (reg < 0)
18002
a14261786239 (encode_invocation_designation): Use macro
Kenichi Handa <handa@m17n.org>
parents: 17835
diff changeset
3900 /* Since CHARSET requests no special designation, designate it
a14261786239 (encode_invocation_designation): Use macro
Kenichi Handa <handa@m17n.org>
parents: 17835
diff changeset
3901 to graphic register 0. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3902 reg = 0;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3903
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3904 ENCODE_DESIGNATION (charset, reg, coding);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3905 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3906
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3907 if (CODING_ISO_INVOCATION (coding, 0) != reg
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3908 && CODING_ISO_INVOCATION (coding, 1) != reg)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3909 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3910 /* Since the graphic register REG is not invoked to any graphic
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3911 planes, invoke it to graphic plane 0. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3912 switch (reg)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3913 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3914 case 0: /* graphic register 0 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3915 ENCODE_SHIFT_IN;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3916 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3917
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3918 case 1: /* graphic register 1 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3919 ENCODE_SHIFT_OUT;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3920 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3921
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3922 case 2: /* graphic register 2 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3923 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3924 ENCODE_SINGLE_SHIFT_2;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3925 else
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3926 ENCODE_LOCKING_SHIFT_2;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3927 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3928
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3929 case 3: /* graphic register 3 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3930 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3931 ENCODE_SINGLE_SHIFT_3;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3932 else
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3933 ENCODE_LOCKING_SHIFT_3;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3934 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3935 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3936 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3937
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3938 *p_nchars = produced_chars;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3939 return dst;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3940 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3941
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
/* The following three macros produce codes for indicating direction
   of text.  */

/* Emit a control sequence introducer.  When the coding system has
   the CODING_ISO_FLAG_SEVEN_BITS flag set, the two ASCII bytes
   ISO_CODE_ESC '[' are emitted; otherwise the single byte
   ISO_CODE_CSI is emitted.

   The flag is tested as a bit (with `&'), like every other
   CODING_ISO_FLAG_* test in this file; comparing the whole flag
   word for equality would select the single-byte form whenever any
   additional flag is set.

   This is an object-like macro: use it as
   `ENCODE_CONTROL_SEQUENCE_INTRODUCER;' with no argument list.  It
   refers to `coding' at the expansion site.  */
#define ENCODE_CONTROL_SEQUENCE_INTRODUCER                              \
  do {                                                                  \
    if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS)         \
      EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, '[');                         \
    else                                                                \
      EMIT_ONE_BYTE (ISO_CODE_CSI);                                     \
  } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3951
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3952
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Produce the code indicating right-to-left text direction: a
   control sequence introducer followed by the ASCII bytes '2' ']'.

   ENCODE_CONTROL_SEQUENCE_INTRODUCER is an object-like macro, so it
   must be used without an argument list; writing `(dst)' after it
   would leave a stray parenthesized expression after the expanded
   `do { ... } while (0)' and fail to compile.  */
#define ENCODE_DIRECTION_R2L()                  \
  do {                                          \
    ENCODE_CONTROL_SEQUENCE_INTRODUCER;         \
    EMIT_TWO_ASCII_BYTES ('2', ']');            \
  } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3958
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3959
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Produce the code indicating left-to-right text direction: a
   control sequence introducer followed by the ASCII bytes '0' ']'.

   ENCODE_CONTROL_SEQUENCE_INTRODUCER is an object-like macro, so it
   must be used without an argument list; writing `(dst)' after it
   would leave a stray parenthesized expression after the expanded
   `do { ... } while (0)' and fail to compile.  */
#define ENCODE_DIRECTION_L2R()                  \
  do {                                          \
    ENCODE_CONTROL_SEQUENCE_INTRODUCER;         \
    EMIT_TWO_ASCII_BYTES ('0', ']');            \
  } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3965
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3966
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
/* Produce codes for designation and invocation to reset the graphic
   planes and registers to initial state.

   First, if the invocation recorded for plane 0 is not register 0,
   ENCODE_SHIFT_IN is expanded.  Then each of the four graphic
   registers that has an initial charset (a non-negative
   CODING_ISO_INITIAL value) different from its current designation
   is re-designated to that initial charset.

   The macro refers to `coding' at the expansion site.  */
#define ENCODE_RESET_PLANE_AND_REGISTER()                               \
  do {                                                                  \
    int reg;                                                            \
    struct charset *charset;                                            \
                                                                        \
    if (CODING_ISO_INVOCATION (coding, 0) != 0)                         \
      ENCODE_SHIFT_IN;                                                  \
    for (reg = 0; reg < 4; reg++)                                       \
      {                                                                 \
        /* No initial charset for this register: nothing to do.  */     \
        if (CODING_ISO_INITIAL (coding, reg) < 0)                       \
          continue;                                                     \
        /* Already designated to its initial charset.  */               \
        if (CODING_ISO_DESIGNATION (coding, reg)                        \
            == CODING_ISO_INITIAL (coding, reg))                        \
          continue;                                                     \
        charset = CHARSET_FROM_ID (CODING_ISO_INITIAL (coding, reg));   \
        ENCODE_DESIGNATION (charset, reg, coding);                      \
      }                                                                 \
  } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3985
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3986
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
3987 /* Produce designation sequences of charsets in the line started from
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3988 SRC to a place pointed by DST, and return updated DST.
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
3989
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
3990 If the current block ends before any end-of-line, we may fail to
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3991 find all the necessary designations. */
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3992
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3993 static unsigned char *
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3994 encode_designation_at_bol (coding, charbuf, charbuf_end, dst)
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
3995 struct coding_system *coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3996 int *charbuf, *charbuf_end;
59168
0345f2b10f1d (decode_coding_XXX, decode_composition_emacs_mule)
Dan Nicolaescu <dann@ics.uci.edu>
parents: 59095
diff changeset
3997 unsigned char *dst;
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
3998 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3999 struct charset *charset;
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4000 /* Table of charsets to be designated to each graphic register. */
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4001 int r[4];
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4002 int c, found = 0, reg;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4003 int produced_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4004 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4005 Lisp_Object attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4006 Lisp_Object charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4007
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4008 attrs = CODING_ID_ATTRS (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4009 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4010 if (EQ (charset_list, Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4011 charset_list = Viso_2022_charset_list;
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4012
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4013 for (reg = 0; reg < 4; reg++)
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4014 r[reg] = -1;
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4015
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4016 while (found < 4)
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4017 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4018 int id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4019
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4020 c = *charbuf++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4021 if (c == '\n')
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4022 break;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4023 charset = char_charset (c, charset_list, NULL);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4024 id = CHARSET_ID (charset);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4025 reg = CODING_ISO_REQUEST (coding, id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4026 if (reg >= 0 && r[reg] < 0)
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4027 {
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4028 found++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4029 r[reg] = id;
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4030 }
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4031 }
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4032
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4033 if (found)
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4034 {
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4035 for (reg = 0; reg < 4; reg++)
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4036 if (r[reg] >= 0
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4037 && CODING_ISO_DESIGNATION (coding, reg) != r[reg])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4038 ENCODE_DESIGNATION (CHARSET_FROM_ID (r[reg]), reg, coding);
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4039 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4040
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4041 return dst;
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4042 }
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4043
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4044 /* See the above "GENERAL NOTES on `encode_coding_XXX ()' functions". */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4045
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4046 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4047 encode_coding_iso_2022 (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4048 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4049 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4050 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4051 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4052 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4053 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4054 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4055 int safe_room = 16;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4056 int bol_designation
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4057 = (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_DESIGNATE_AT_BOL
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4058 && CODING_ISO_BOL (coding));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4059 int produced_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4060 Lisp_Object attrs, eol_type, charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4061 int ascii_compatible;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4062 int c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4063 int preferred_charset_id = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4064
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4065 CODING_GET_INFO (coding, attrs, charset_list);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4066 eol_type = CODING_ID_EOL_TYPE (coding->id);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4067 if (VECTORP (eol_type))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4068 eol_type = Qunix;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4069
88497
d2b9e0d4c2f6 (Fdecode_sjis_char): Fix typo (0x7F->0xFF). Fix the
Kenichi Handa <handa@m17n.org>
parents: 88485
diff changeset
4070 setup_iso_safe_charsets (attrs);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4071 /* Charset list may have been changed. */
90772
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
4072 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4073 coding->safe_charsets = (char *) SDATA (CODING_ATTR_SAFE_CHARSETS(attrs));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4074
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4075 ascii_compatible = ! NILP (CODING_ATTR_ASCII_COMPAT (attrs));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4076
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4077 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4078 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4079 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4080
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4081 if (bol_designation)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4082 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4083 unsigned char *dst_prev = dst;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4084
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4085 /* We have to produce designation sequences if any now. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4086 dst = encode_designation_at_bol (coding, charbuf, charbuf_end, dst);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4087 bol_designation = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4088 /* We are sure that designation sequences are all ASCII bytes. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4089 produced_chars += dst - dst_prev;
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4090 }
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4091
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4092 c = *charbuf++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4093
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4094 if (c < 0)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4095 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4096 /* Handle an annotation. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4097 switch (*charbuf)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4098 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4099 case CODING_ANNOTATE_COMPOSITION_MASK:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4100 /* Not yet implemented. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4101 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4102 case CODING_ANNOTATE_CHARSET_MASK:
90014
ade0c9a12f99 (encode_coding_iso_2022): Fix handling of charset
Kenichi Handa <handa@m17n.org>
parents: 90011
diff changeset
4103 preferred_charset_id = charbuf[2];
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4104 if (preferred_charset_id >= 0
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4105 && NILP (Fmemq (make_number (preferred_charset_id),
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4106 charset_list)))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4107 preferred_charset_id = -1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4108 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4109 default:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4110 abort ();
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
4111 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4112 charbuf += -c - 1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4113 continue;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4114 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4115
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4116 /* Now encode the character C. */
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4117 if (c < 0x20 || c == 0x7F)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4118 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4119 if (c == '\n'
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4120 || (c == '\r' && EQ (eol_type, Qmac)))
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4121 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4122 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_RESET_AT_EOL)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4123 ENCODE_RESET_PLANE_AND_REGISTER ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4124 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_INIT_AT_BOL)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4125 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4126 int i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4127
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4128 for (i = 0; i < 4; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4129 CODING_ISO_DESIGNATION (coding, i)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4130 = CODING_ISO_INITIAL (coding, i);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4131 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4132 bol_designation
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4133 = CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_DESIGNATE_AT_BOL;
19052
302a7b2a6948 (encode_coding_iso2022): Write out invalid multibyte
Kenichi Handa <handa@m17n.org>
parents: 18910
diff changeset
4134 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4135 else if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_RESET_AT_CNTL)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4136 ENCODE_RESET_PLANE_AND_REGISTER ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4137 EMIT_ONE_ASCII_BYTE (c);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4138 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4139 else if (ASCII_CHAR_P (c))
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4140 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4141 if (ascii_compatible)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4142 EMIT_ONE_ASCII_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4143 else
88681
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4144 {
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4145 struct charset *charset = CHARSET_FROM_ID (charset_ascii);
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4146 ENCODE_ISO_CHARACTER (charset, c);
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4147 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4148 }
88690
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4149 else if (CHAR_BYTE8_P (c))
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4150 {
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4151 c = CHAR_TO_BYTE8 (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4152 EMIT_ONE_BYTE (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4153 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4154 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4155 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4156 struct charset *charset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4157
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4158 if (preferred_charset_id >= 0)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4159 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4160 charset = CHARSET_FROM_ID (preferred_charset_id);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4161 if (! CHAR_CHARSET_P (c, charset))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4162 charset = char_charset (c, charset_list, NULL);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4163 }
42104
d69c2368e549 (DECODE_COMPOSITION_END): Fixed a typo in the last
Sam Steingold <sds@gnu.org>
parents: 42103
diff changeset
4164 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4165 charset = char_charset (c, charset_list, NULL);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4166 if (!charset)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4167 {
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4168 if (coding->mode & CODING_MODE_SAFE_ENCODING)
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4169 {
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4170 c = CODING_INHIBIT_CHARACTER_SUBSTITUTION;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4171 charset = CHARSET_FROM_ID (charset_ascii);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4172 }
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4173 else
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4174 {
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4175 c = coding->default_char;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4176 charset = char_charset (c, charset_list, NULL);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4177 }
19052
302a7b2a6948 (encode_coding_iso2022): Write out invalid multibyte
Kenichi Handa <handa@m17n.org>
parents: 18910
diff changeset
4178 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4179 ENCODE_ISO_CHARACTER (charset, c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4180 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4181 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4182
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4183 if (coding->mode & CODING_MODE_LAST_BLOCK
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4184 && CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_RESET_AT_EOL)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4185 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4186 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4187 ENCODE_RESET_PLANE_AND_REGISTER ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4188 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4189 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4190 CODING_ISO_BOL (coding) = bol_designation;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4191 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4192 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4193 return 0;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4194 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4195
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4196
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4197 /*** 8,9. SJIS and BIG5 handlers ***/
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4198
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4199 /* Although SJIS and BIG5 are not ISO coding systems, they are used
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4200 quite widely. So, for the moment, Emacs supports them in the bare
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4201 C code. But, in the future, they may be supported only by CCL. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4202
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4203 /* SJIS is a coding system encoding three character sets: ASCII, right
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4204 half of JISX0201-Kana, and JISX0208. An ASCII character is encoded
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4205 as is. A character of charset katakana-jisx0201 is encoded by
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4206 "position-code + 0x80". A character of charset japanese-jisx0208
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4207 is encoded in two bytes, but its two position-codes are divided and shifted
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4208 so that they fit in the range below.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4209
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4210 --- CODE RANGE of SJIS ---
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4211 (character set) (range)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4212 ASCII 0x00 .. 0x7F
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4213 KATAKANA-JISX0201 0xA0 .. 0xDF
24324
2eec590faf26 (Fdecode_sjis_char, Fencode_sjis_char): Hanlde
Kenichi Handa <handa@m17n.org>
parents: 24316
diff changeset
4214 JISX0208 (1st byte) 0x81 .. 0x9F and 0xE0 .. 0xEF
23564
6eb3e346d1fd (DECODE_CHARACTER_ASCII): Check validity of inserted
Kenichi Handa <handa@m17n.org>
parents: 23542
diff changeset
4215 (2nd byte) 0x40 .. 0x7E and 0x80 .. 0xFC
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4216 -------------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4217
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4218 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4219
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4220 /* BIG5 is a coding system encoding two character sets: ASCII and
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4221 Big5. An ASCII character is encoded as is. Big5 is a two-byte
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4222 character set and is encoded in two bytes.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4223
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4224 --- CODE RANGE of BIG5 ---
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4225 (character set) (range)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4226 ASCII 0x00 .. 0x7F
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4227 Big5 (1st byte) 0xA1 .. 0xFE
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4228 (2nd byte) 0x40 .. 0x7E and 0xA1 .. 0xFE
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4229 --------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4230
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4231 */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4232
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4233 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4234 Check if a text is encoded in SJIS. If it may be, return 1 (setting
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4235 CATEGORY_MASK_SJIS in DETECT_INFO->found if SJIS-specific bytes were seen), else return 0. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4236
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
4237 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4238 detect_coding_sjis (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4239 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4240 struct coding_detection_info *detect_info;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4241 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4242 const unsigned char *src = coding->source, *src_base;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4243 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4244 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4245 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4246 int found = 0;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4247 int c;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4248
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4249 detect_info->checked |= CATEGORY_MASK_SJIS;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4250 /* A coding system of this category is always ASCII compatible. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4251 src += coding->head_ascii;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4252
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4253 while (1)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4254 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4255 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4256 ONE_MORE_BYTE (c);
36647
0a75ccbe42b2 (detect_coding_sjis): Do more rigid check.
Kenichi Handa <handa@m17n.org>
parents: 36520
diff changeset
4257 if (c < 0x80)
0a75ccbe42b2 (detect_coding_sjis): Do more rigid check.
Kenichi Handa <handa@m17n.org>
parents: 36520
diff changeset
4258 continue;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4259 if ((c >= 0x81 && c <= 0x9F) || (c >= 0xE0 && c <= 0xEF))
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4260 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4261 ONE_MORE_BYTE (c);
36647
0a75ccbe42b2 (detect_coding_sjis): Do more rigid check.
Kenichi Handa <handa@m17n.org>
parents: 36520
diff changeset
4262 if (c < 0x40 || c == 0x7F || c > 0xFC)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4263 break;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4264 found = CATEGORY_MASK_SJIS;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4265 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4266 else if (c >= 0xA0 && c < 0xE0)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4267 found = CATEGORY_MASK_SJIS;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4268 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4269 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4270 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4271 detect_info->rejected |= CATEGORY_MASK_SJIS;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4272 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4273
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4274 no_more_source:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4275 if (src_base < src && coding->mode & CODING_MODE_LAST_BLOCK)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4276 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4277 detect_info->rejected |= CATEGORY_MASK_SJIS;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4278 return 0;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4279 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4280 detect_info->found |= found;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4281 return 1;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4282 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4283
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4284 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4285 Check if a text is encoded in BIG5. If it may be, return 1 (setting
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4286 CATEGORY_MASK_BIG5 in DETECT_INFO->found if BIG5-specific bytes were seen), else return 0. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4287
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
4288 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4289 detect_coding_big5 (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4290 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4291 struct coding_detection_info *detect_info;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4292 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4293 const unsigned char *src = coding->source, *src_base;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4294 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4295 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4296 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4297 int found = 0;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4298 int c;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4299
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4300 detect_info->checked |= CATEGORY_MASK_BIG5;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4301 /* A coding system of this category is always ASCII compatible. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4302 src += coding->head_ascii;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4303
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4304 while (1)
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4305 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4306 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4307 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4308 if (c < 0x80)
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4309 continue;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4310 if (c >= 0xA1)
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4311 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4312 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4313 if (c < 0x40 || (c >= 0x7F && c <= 0xA0))
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4314 return 0;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4315 found = CATEGORY_MASK_BIG5;
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4316 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4317 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4318 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4319 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4320 detect_info->rejected |= CATEGORY_MASK_BIG5;
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4321 return 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4322
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4323 no_more_source:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4324 if (src_base < src && coding->mode & CODING_MODE_LAST_BLOCK)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4325 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4326 detect_info->rejected |= CATEGORY_MASK_BIG5;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4327 return 0;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4328 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4329 detect_info->found |= found;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4330 return 1;
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4331 }
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4332
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4333 /* See the above "GENERAL NOTES on `decode_coding_XXX ()' functions".
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4334 If SJIS_P is 1, decode SJIS text, else decode BIG5 text. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4335
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4336 static void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4337 decode_coding_sjis (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4338 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4339 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4340 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4341 const unsigned char *src_end = coding->source + coding->src_bytes;
59168
0345f2b10f1d (decode_coding_XXX, decode_composition_emacs_mule)
Dan Nicolaescu <dann@ics.uci.edu>
parents: 59095
diff changeset
4342 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4343 int *charbuf = coding->charbuf + coding->charbuf_used;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4344 int *charbuf_end
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4345 = coding->charbuf + coding->charbuf_size - MAX_ANNOTATION_LENGTH;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4346 int consumed_chars = 0, consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4347 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4348 struct charset *charset_roman, *charset_kanji, *charset_kana;
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4349 struct charset *charset_kanji2;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4350 Lisp_Object attrs, charset_list, val;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4351 int char_offset = coding->produced_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4352 int last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4353 int last_id = charset_ascii;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4354 int eol_crlf = EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4355 int byte_after_cr = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4356
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4357 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4358
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4359 val = charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4360 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4361 charset_kana = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4362 charset_kanji = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4363 charset_kanji2 = NILP (val) ? NULL : CHARSET_FROM_ID (XINT (XCAR (val)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4364
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4365 while (1)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4366 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4367 int c, c1;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4368 struct charset *charset;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4369
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4370 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4371 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4372
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4373 if (charbuf >= charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4374 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4375
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4376 if (byte_after_cr >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4377 c = byte_after_cr, byte_after_cr = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4378 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4379 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4380 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4381 goto invalid_code;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4382 if (c < 0x80)
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4383 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4384 if (eol_crlf && c == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4385 ONE_MORE_BYTE (byte_after_cr);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4386 charset = charset_roman;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4387 }
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4388 else if (c == 0x80 || c == 0xA0)
89730
d8fcefca5cf6 (decode_coding_sjis): Check the first byte rigidly.
Kenichi Handa <handa@m17n.org>
parents: 89686
diff changeset
4389 goto invalid_code;
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4390 else if (c >= 0xA1 && c <= 0xDF)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4391 {
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4392 /* SJIS -> JISX0201-Kana */
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4393 c &= 0x7F;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4394 charset = charset_kana;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4395 }
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4396 else if (c <= 0xEF)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4397 {
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4398 /* SJIS -> JISX0208 */
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4399 ONE_MORE_BYTE (c1);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4400 if (c1 < 0x40 || c1 == 0x7F || c1 > 0xFC)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4401 goto invalid_code;
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4402 c = (c << 8) | c1;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4403 SJIS_TO_JIS (c);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4404 charset = charset_kanji;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4405 }
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4406 else if (c <= 0xFC && charset_kanji2)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4407 {
89779
74c503490829 (decode_coding_sjis): Fix comment.
Kenichi Handa <handa@m17n.org>
parents: 89764
diff changeset
4408 /* SJIS -> JISX0213-2 */
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4409 ONE_MORE_BYTE (c1);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4410 if (c1 < 0x40 || c1 == 0x7F || c1 > 0xFC)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4411 goto invalid_code;
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4412 c = (c << 8) | c1;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4413 SJIS_TO_JIS2 (c);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4414 charset = charset_kanji2;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4415 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4416 else
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4417 goto invalid_code;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4418 if (charset->id != charset_ascii
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4419 && last_id != charset->id)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4420 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4421 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4422 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4423 last_id = charset->id;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4424 last_offset = char_offset;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4425 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4426 CODING_DECODE_CHAR (coding, src, src_base, src_end, charset, c, c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4427 *charbuf++ = c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4428 char_offset++;
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
4429 continue;
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
4430
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4431 invalid_code:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4432 src = src_base;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4433 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4434 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4435 *charbuf++ = c < 0 ? -c : BYTE8_TO_CHAR (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4436 char_offset++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4437 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4438 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4439
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4440 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4441 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4442 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4443 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4444 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4445 coding->charbuf_used = charbuf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4446 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4447
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4448 static void
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4449 decode_coding_big5 (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4450 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4451 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4452 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4453 const unsigned char *src_end = coding->source + coding->src_bytes;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4454 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4455 int *charbuf = coding->charbuf + coding->charbuf_used;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4456 int *charbuf_end
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4457 = coding->charbuf + coding->charbuf_size - MAX_ANNOTATION_LENGTH;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4458 int consumed_chars = 0, consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4459 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4460 struct charset *charset_roman, *charset_big5;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4461 Lisp_Object attrs, charset_list, val;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4462 int char_offset = coding->produced_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4463 int last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4464 int last_id = charset_ascii;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4465 int eol_crlf = EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4466 int byte_after_cr = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4467
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4468 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4469 val = charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4470 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4471 charset_big5 = CHARSET_FROM_ID (XINT (XCAR (val)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4472
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4473 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4474 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4475 int c, c1;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4476 struct charset *charset;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4477
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4478 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4479 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4480
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4481 if (charbuf >= charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4482 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4483
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4484 if (byte_after_cr >= 0)
92406
c36bda0a03cc (decode_coding_big5, produce_chars): Fix typos in last
Andreas Schwab <schwab@suse.de>
parents: 92399
diff changeset
4485 c = byte_after_cr, byte_after_cr = -1;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4486 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4487 ONE_MORE_BYTE (c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4488
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4489 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4490 goto invalid_code;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4491 if (c < 0x80)
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4492 {
92406
c36bda0a03cc (decode_coding_big5, produce_chars): Fix typos in last
Andreas Schwab <schwab@suse.de>
parents: 92399
diff changeset
4493 if (eol_crlf && c == '\r')
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4494 ONE_MORE_BYTE (byte_after_cr);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4495 charset = charset_roman;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4496 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4497 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4498 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4499 /* BIG5 -> Big5 */
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4500 if (c < 0xA1 || c > 0xFE)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4501 goto invalid_code;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4502 ONE_MORE_BYTE (c1);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4503 if (c1 < 0x40 || (c1 > 0x7E && c1 < 0xA1) || c1 > 0xFE)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4504 goto invalid_code;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4505 c = c << 8 | c1;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4506 charset = charset_big5;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4507 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4508 if (charset->id != charset_ascii
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4509 && last_id != charset->id)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4510 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4511 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4512 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4513 last_id = charset->id;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4514 last_offset = char_offset;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4515 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4516 CODING_DECODE_CHAR (coding, src, src_base, src_end, charset, c, c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4517 *charbuf++ = c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4518 char_offset++;
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
4519 continue;
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
4520
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4521 invalid_code:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4522 src = src_base;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4523 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4524 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4525 *charbuf++ = c < 0 ? -c : BYTE8_TO_CHAR (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4526 char_offset++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4527 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4528 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4529
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4530 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4531 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4532 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4533 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4534 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4535 coding->charbuf_used = charbuf - coding->charbuf;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4536 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4537
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4538 /* See the above "GENERAL NOTES on `encode_coding_XXX ()' functions".
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4539 This function can encode charsets `ascii', `katakana-jisx0201',
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4540 `japanese-jisx0208', `chinese-big5-1', and `chinese-big5-2'. We
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4541 are sure that all these charsets are registered as official charset
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4542 (i.e. do not have extended leading-codes). Characters of other
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4543 charsets are produced without any encoding. If SJIS_P is 1, encode
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4544 SJIS text, else encode BIG5 text. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4545
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4546 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4547 encode_coding_sjis (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4548 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4549 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4550 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4551 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4552 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4553 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4554 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4555 int safe_room = 4;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4556 int produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4557 Lisp_Object attrs, charset_list, val;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4558 int ascii_compatible;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4559 struct charset *charset_roman, *charset_kanji, *charset_kana;
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4560 struct charset *charset_kanji2;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4561 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4562
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4563 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4564 val = charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4565 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4566 charset_kana = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4567 charset_kanji = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4568 charset_kanji2 = NILP (val) ? NULL : CHARSET_FROM_ID (XINT (XCAR (val)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4569
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4570 ascii_compatible = ! NILP (CODING_ATTR_ASCII_COMPAT (attrs));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4571
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4572 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4573 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4574 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4575 c = *charbuf++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4576 /* Now encode the character C. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4577 if (ASCII_CHAR_P (c) && ascii_compatible)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4578 EMIT_ONE_ASCII_BYTE (c);
88690
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4579 else if (CHAR_BYTE8_P (c))
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4580 {
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4581 c = CHAR_TO_BYTE8 (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4582 EMIT_ONE_BYTE (c);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4583 }
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4584 else
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4585 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4586 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4587 struct charset *charset = char_charset (c, charset_list, &code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4588
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4589 if (!charset)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4590 {
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4591 if (coding->mode & CODING_MODE_SAFE_ENCODING)
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4592 {
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4593 code = CODING_INHIBIT_CHARACTER_SUBSTITUTION;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4594 charset = CHARSET_FROM_ID (charset_ascii);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4595 }
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4596 else
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4597 {
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4598 c = coding->default_char;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4599 charset = char_charset (c, charset_list, &code);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4600 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4601 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4602 if (code == CHARSET_INVALID_CODE (charset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4603 abort ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4604 if (charset == charset_kanji)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4605 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4606 int c1, c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4607 JIS_TO_SJIS (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4608 c1 = code >> 8, c2 = code & 0xFF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4609 EMIT_TWO_BYTES (c1, c2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4610 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4611 else if (charset == charset_kana)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4612 EMIT_ONE_BYTE (code | 0x80);
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4613 else if (charset_kanji2 && charset == charset_kanji2)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4614 {
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4615 int c1, c2;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4616
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4617 c1 = code >> 8;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4618 if (c1 == 0x21 || (c1 >= 0x23 && c1 < 0x25)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4619 || (c1 >= 0x2C && c1 <= 0x2F) || c1 >= 0x6E)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4620 {
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4621 JIS_TO_SJIS2 (code);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4622 c1 = code >> 8, c2 = code & 0xFF;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4623 EMIT_TWO_BYTES (c1, c2);
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4624 }
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4625 else
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4626 EMIT_ONE_ASCII_BYTE (code & 0x7F);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4627 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4628 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4629 EMIT_ONE_ASCII_BYTE (code & 0x7F);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4630 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4631 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4632 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4633 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4634 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4635 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4636 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4637
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4638 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4639 encode_coding_big5 (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4640 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4641 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4642 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4643 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4644 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4645 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4646 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4647 int safe_room = 4;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4648 int produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4649 Lisp_Object attrs, charset_list, val;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4650 int ascii_compatible;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4651 struct charset *charset_roman, *charset_big5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4652 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4653
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4654 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4655 val = charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4656 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4657 charset_big5 = CHARSET_FROM_ID (XINT (XCAR (val)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4658 ascii_compatible = ! NILP (CODING_ATTR_ASCII_COMPAT (attrs));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4659
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4660 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4661 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4662 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4663 c = *charbuf++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4664 /* Now encode the character C. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4665 if (ASCII_CHAR_P (c) && ascii_compatible)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4666 EMIT_ONE_ASCII_BYTE (c);
88690
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4667 else if (CHAR_BYTE8_P (c))
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4668 {
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4669 c = CHAR_TO_BYTE8 (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4670 EMIT_ONE_BYTE (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4671 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4672 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4673 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4674 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4675 struct charset *charset = char_charset (c, charset_list, &code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4676
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4677 if (! charset)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4678 {
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4679 if (coding->mode & CODING_MODE_SAFE_ENCODING)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4680 {
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4681 code = CODING_INHIBIT_CHARACTER_SUBSTITUTION;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4682 charset = CHARSET_FROM_ID (charset_ascii);
51140
94d903190cee (ENCODE_UNSAFE_CHARACTER): Adjusted for the name change
Kenichi Handa <handa@m17n.org>
parents: 51090
diff changeset
4683 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4684 else
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4685 {
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4686 c = coding->default_char;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4687 charset = char_charset (c, charset_list, &code);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4688 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4689 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4690 if (code == CHARSET_INVALID_CODE (charset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4691 abort ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4692 if (charset == charset_big5)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4693 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4694 int c1, c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4695
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4696 c1 = code >> 8, c2 = code & 0xFF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4697 EMIT_TWO_BYTES (c1, c2);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4698 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4699 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4700 EMIT_ONE_ASCII_BYTE (code & 0x7F);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4701 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4702 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4703 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4704 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4705 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4706 return 0;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4707 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4708
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4709
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4710 /*** 10. CCL handlers ***/
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
4711
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
4712 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
4713 Check if a text is encoded in a coding system of which
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
4714 encoder/decoder are written in CCL program. If it is, return
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4715 CATEGORY_MASK_CCL, else return 0. */
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
4716
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
4717 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4718 detect_coding_ccl (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4719 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4720 struct coding_detection_info *detect_info;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4721 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4722 const unsigned char *src = coding->source, *src_base;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4723 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4724 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4725 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4726 int found = 0;
89848
3edfa038a435 (detect_coding_emacs_mule): Fix counting of encoded
Kenichi Handa <handa@m17n.org>
parents: 89842
diff changeset
4727 unsigned char *valids;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4728 int head_ascii = coding->head_ascii;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4729 Lisp_Object attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4730
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4731 detect_info->checked |= CATEGORY_MASK_CCL;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4732
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4733 coding = &coding_categories[coding_category_ccl];
89848
3edfa038a435 (detect_coding_emacs_mule): Fix counting of encoded
Kenichi Handa <handa@m17n.org>
parents: 89842
diff changeset
4734 valids = CODING_CCL_VALIDS (coding);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4735 attrs = CODING_ID_ATTRS (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4736 if (! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4737 src += head_ascii;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4738
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4739 while (1)
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
4740 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4741 int c;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4742
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4743 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4744 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4745 if (c < 0 || ! valids[c])
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4746 break;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4747 if ((valids[c] > 1))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4748 found = CATEGORY_MASK_CCL;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4749 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4750 detect_info->rejected |= CATEGORY_MASK_CCL;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4751 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4752
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4753 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4754 detect_info->found |= found;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4755 return 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4756 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4757
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4758 static void
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4759 decode_coding_ccl (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4760 struct coding_system *coding;
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
4761 {
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
4762 const unsigned char *src = coding->source + coding->consumed;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4763 const unsigned char *src_end = coding->source + coding->src_bytes;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4764 int *charbuf = coding->charbuf + coding->charbuf_used;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4765 int *charbuf_end = coding->charbuf + coding->charbuf_size;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4766 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4767 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4768 struct ccl_program ccl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4769 int source_charbuf[1024];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4770 int source_byteidx[1024];
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4771 Lisp_Object attrs, charset_list;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4772
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4773 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4774 setup_ccl_program (&ccl, CODING_CCL_DECODER (coding));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4775
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4776 while (src < src_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4777 {
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
4778 const unsigned char *p = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4779 int *source, *source_end;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4780 int i = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4781
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4782 if (multibytep)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4783 while (i < 1024 && p < src_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4784 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4785 source_byteidx[i] = p - src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4786 source_charbuf[i++] = STRING_CHAR_ADVANCE (p);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4787 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4788 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4789 while (i < 1024 && p < src_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4790 source_charbuf[i++] = *p++;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4791
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4792 if (p == src_end && coding->mode & CODING_MODE_LAST_BLOCK)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4793 ccl.last_block = 1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4794
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4795 source = source_charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4796 source_end = source + i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4797 while (source < source_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4798 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4799 ccl_driver (&ccl, source, charbuf,
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
4800 source_end - source, charbuf_end - charbuf,
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
4801 charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4802 source += ccl.consumed;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4803 charbuf += ccl.produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4804 if (ccl.status != CCL_STAT_SUSPEND_BY_DST)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4805 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4806 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4807 if (source < source_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4808 src += source_byteidx[source - source_charbuf];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4809 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4810 src = p;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4811 consumed_chars += source - source_charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4812
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4813 if (ccl.status != CCL_STAT_SUSPEND_BY_SRC
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4814 && ccl.status != CODING_RESULT_INSUFFICIENT_SRC)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4815 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4816 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4817
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4818 switch (ccl.status)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4819 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4820 case CCL_STAT_SUSPEND_BY_SRC:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4821 record_conversion_result (coding, CODING_RESULT_INSUFFICIENT_SRC);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4822 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4823 case CCL_STAT_SUSPEND_BY_DST:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4824 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4825 case CCL_STAT_QUIT:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4826 case CCL_STAT_INVALID_CMD:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4827 record_conversion_result (coding, CODING_RESULT_INTERRUPT);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4828 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4829 default:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4830 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4831 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4832 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4833 coding->consumed_char += consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4834 coding->consumed = src - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4835 coding->charbuf_used = charbuf - coding->charbuf;
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
4836 }
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
4837
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4838 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4839 encode_coding_ccl (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4840 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4841 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4842 struct ccl_program ccl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4843 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4844 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4845 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4846 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4847 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4848 int destination_charbuf[1024];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4849 int i, produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4850 Lisp_Object attrs, charset_list;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4851
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4852 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4853 setup_ccl_program (&ccl, CODING_CCL_ENCODER (coding));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4854
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4855 ccl.last_block = coding->mode & CODING_MODE_LAST_BLOCK;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4856 ccl.dst_multibyte = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4857
90346
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
4858 while (charbuf < charbuf_end)
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
4859 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4860 ccl_driver (&ccl, charbuf, destination_charbuf,
90346
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
4861 charbuf_end - charbuf, 1024, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4862 if (multibytep)
90346
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
4863 {
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
4864 ASSURE_DESTINATION (ccl.produced * 2);
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
4865 for (i = 0; i < ccl.produced; i++)
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
4866 EMIT_ONE_BYTE (destination_charbuf[i] & 0xFF);
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
4867 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4868 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4869 {
90346
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
4870 ASSURE_DESTINATION (ccl.produced);
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
4871 for (i = 0; i < ccl.produced; i++)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4872 *dst++ = destination_charbuf[i] & 0xFF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4873 produced_chars += ccl.produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4874 }
90346
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
4875 charbuf += ccl.consumed;
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
4876 if (ccl.status == CCL_STAT_QUIT
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
4877 || ccl.status == CCL_STAT_INVALID_CMD)
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
4878 break;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4879 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4880
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4881 switch (ccl.status)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4882 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4883 case CCL_STAT_SUSPEND_BY_SRC:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4884 record_conversion_result (coding, CODING_RESULT_INSUFFICIENT_SRC);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4885 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4886 case CCL_STAT_SUSPEND_BY_DST:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4887 record_conversion_result (coding, CODING_RESULT_INSUFFICIENT_DST);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4888 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4889 case CCL_STAT_QUIT:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4890 case CCL_STAT_INVALID_CMD:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4891 record_conversion_result (coding, CODING_RESULT_INTERRUPT);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4892 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4893 default:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4894 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4895 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4896 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4897
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4898 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4899 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4900 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4901 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4902
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
4903
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
4904
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4905 /*** 10, 11. no-conversion handlers ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4906
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4907 /* See the above "GENERAL NOTES on `decode_coding_XXX ()' functions". */
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4908
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4909 static void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4910 decode_coding_raw_text (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4911 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4912 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4913 int eol_crlf = EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4914
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4915 coding->chars_at_source = 1;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4916 coding->consumed_char = coding->src_chars;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4917 coding->consumed = coding->src_bytes;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4918 if (eol_crlf && coding->source[coding->src_bytes - 1] == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4919 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4920 coding->consumed_char--;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4921 coding->consumed--;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4922 record_conversion_result (coding, CODING_RESULT_INSUFFICIENT_SRC);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4923 }
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4924 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4925 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4926 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4927
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4928 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4929 encode_coding_raw_text (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4930 struct coding_system *coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4931 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4932 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4933 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4934 int *charbuf_end = coding->charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4935 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4936 unsigned char *dst_end = coding->destination + coding->dst_bytes;
95345
0350e5efb8f7 (encode_coding_raw_text): Fix last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 95344
diff changeset
4937 int produced_chars = 0;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4938 int c;
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4939
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4940 if (multibytep)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4941 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4942 int safe_room = MAX_MULTIBYTE_LENGTH * 2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4943
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4944 if (coding->src_multibyte)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4945 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4946 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4947 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4948 c = *charbuf++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4949 if (ASCII_CHAR_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4950 EMIT_ONE_ASCII_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4951 else if (CHAR_BYTE8_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4952 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4953 c = CHAR_TO_BYTE8 (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4954 EMIT_ONE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4955 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4956 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4957 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4958 unsigned char str[MAX_MULTIBYTE_LENGTH], *p0 = str, *p1 = str;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4959
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4960 CHAR_STRING_ADVANCE (c, p1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4961 while (p0 < p1)
88950
ad258ee59fbb * coding.c (make_conversion_work_buffer): Adjusted for the change
Kenichi Handa <handa@m17n.org>
parents: 88936
diff changeset
4962 {
ad258ee59fbb * coding.c (make_conversion_work_buffer): Adjusted for the change
Kenichi Handa <handa@m17n.org>
parents: 88936
diff changeset
4963 EMIT_ONE_BYTE (*p0);
ad258ee59fbb * coding.c (make_conversion_work_buffer): Adjusted for the change
Kenichi Handa <handa@m17n.org>
parents: 88936
diff changeset
4964 p0++;
ad258ee59fbb * coding.c (make_conversion_work_buffer): Adjusted for the change
Kenichi Handa <handa@m17n.org>
parents: 88936
diff changeset
4965 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4966 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4967 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4968 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4969 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4970 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4971 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4972 c = *charbuf++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4973 EMIT_ONE_BYTE (c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4974 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
4975 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
4976 else
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
4977 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4978 if (coding->src_multibyte)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
4979 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4980 int safe_room = MAX_MULTIBYTE_LENGTH;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4981
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4982 while (charbuf < charbuf_end)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4983 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4984 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4985 c = *charbuf++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4986 if (ASCII_CHAR_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4987 *dst++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4988 else if (CHAR_BYTE8_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4989 *dst++ = CHAR_TO_BYTE8 (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4990 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4991 CHAR_STRING_ADVANCE (c, dst);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4992 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
4993 }
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
4994 else
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
4995 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4996 ASSURE_DESTINATION (charbuf_end - charbuf);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4997 while (charbuf < charbuf_end && dst < dst_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4998 *dst++ = *charbuf++;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4999 }
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
5000 produced_chars = dst - (coding->destination + coding->produced);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5001 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5002 record_conversion_result (coding, CODING_RESULT_SUCCESS);
95345
0350e5efb8f7 (encode_coding_raw_text): Fix last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 95344
diff changeset
5003 coding->produced_char += produced_chars;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5004 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5005 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5006 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5007
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5008 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5009 Check if a text is encoded in a charset-based coding system. If it
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5010 is, return 1, else return 0. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5011
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5012 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5013 detect_coding_charset (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5014 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5015 struct coding_detection_info *detect_info;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5016 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5017 const unsigned char *src = coding->source, *src_base;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5018 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5019 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5020 int consumed_chars = 0;
98951
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5021 Lisp_Object attrs, valids, name;
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
5022 int found = 0;
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5023 int head_ascii = coding->head_ascii;
98951
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5024 int check_latin_extra = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5025
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5026 detect_info->checked |= CATEGORY_MASK_CHARSET;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5027
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5028 coding = &coding_categories[coding_category_charset];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5029 attrs = CODING_ID_ATTRS (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5030 valids = AREF (attrs, coding_attr_charset_valids);
98951
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5031 name = CODING_ID_NAME (coding->id);
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5032 if (VECTORP (Vlatin_extra_code_table)
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5033 && strcmp ((char *) SDATA (SYMBOL_NAME (name)), "iso-8859-"))
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5034 check_latin_extra = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5035 if (! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5036 src += head_ascii;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5037
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5038 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5039 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5040 int c;
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5041 Lisp_Object val;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5042 struct charset *charset;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5043 int dim, idx;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5044
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5045 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5046 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5047 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5048 continue;
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5049 val = AREF (valids, c);
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5050 if (NILP (val))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5051 break;
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
5052 if (c >= 0x80)
98951
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5053 {
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5054 if (c < 0xA0
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5055 && check_latin_extra
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5056 && NILP (XVECTOR (Vlatin_extra_code_table)->contents[c]))
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5057 break;
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5058 found = CATEGORY_MASK_CHARSET;
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5059 }
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5060 if (INTEGERP (val))
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5061 {
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5062 charset = CHARSET_FROM_ID (XFASTINT (val));
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5063 dim = CHARSET_DIMENSION (charset);
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5064 for (idx = 1; idx < dim; idx++)
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
5065 {
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5066 if (src == src_end)
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5067 goto too_short;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5068 ONE_MORE_BYTE (c);
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
5069 if (c < charset->code_space[(dim - 1 - idx) * 2]
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5070 || c > charset->code_space[(dim - 1 - idx) * 2 + 1])
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5071 break;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5072 }
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5073 if (idx < dim)
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5074 break;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5075 }
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5076 else
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5077 {
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5078 idx = 1;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5079 for (; CONSP (val); val = XCDR (val))
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5080 {
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5081 charset = CHARSET_FROM_ID (XFASTINT (XCAR (val)));
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5082 dim = CHARSET_DIMENSION (charset);
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5083 while (idx < dim)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5084 {
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5085 if (src == src_end)
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5086 goto too_short;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5087 ONE_MORE_BYTE (c);
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5088 if (c < charset->code_space[(dim - 1 - idx) * 4]
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5089 || c > charset->code_space[(dim - 1 - idx) * 4 + 1])
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5090 break;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5091 idx++;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5092 }
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5093 if (idx == dim)
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5094 {
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5095 val = Qnil;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5096 break;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5097 }
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
5098 }
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5099 if (CONSP (val))
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5100 break;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5101 }
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5102 }
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5103 too_short:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5104 detect_info->rejected |= CATEGORY_MASK_CHARSET;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5105 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5106
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5107 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5108 detect_info->found |= found;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5109 return 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5110 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5111
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5112 static void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5113 decode_coding_charset (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5114 struct coding_system *coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5115 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5116 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5117 const unsigned char *src_end = coding->source + coding->src_bytes;
46548
cb1914307488 (encode_eol, detect_coding, detect_eol):
Ken Raeburn <raeburn@raeburn.org>
parents: 46462
diff changeset
5118 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5119 int *charbuf = coding->charbuf + coding->charbuf_used;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5120 int *charbuf_end
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5121 = coding->charbuf + coding->charbuf_size - MAX_ANNOTATION_LENGTH;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5122 int consumed_chars = 0, consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5123 int multibytep = coding->src_multibyte;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5124 Lisp_Object attrs, charset_list, valids;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5125 int char_offset = coding->produced_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5126 int last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5127 int last_id = charset_ascii;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5128 int eol_crlf = EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5129 int byte_after_cr = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5130
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5131 CODING_GET_INFO (coding, attrs, charset_list);
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5132 valids = AREF (attrs, coding_attr_charset_valids);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5133
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5134 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5135 {
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5136 int c;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5137 Lisp_Object val;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5138 struct charset *charset;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5139 int dim;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5140 int len = 1;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5141 unsigned code;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5142
29093
176708661b08 (encode_eol): Fix a bug of DOS style EOL encoding.
Kenichi Handa <handa@m17n.org>
parents: 29005
diff changeset
5143 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5144 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5145
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5146 if (charbuf >= charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5147 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5148
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5149 if (byte_after_cr >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5150 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5151 c = byte_after_cr;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5152 byte_after_cr = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5153 }
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5154 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5155 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5156 ONE_MORE_BYTE (c);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5157 if (eol_crlf && c == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5158 ONE_MORE_BYTE (byte_after_cr);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5159 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5160 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5161 goto invalid_code;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5162 code = c;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5163
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5164 val = AREF (valids, c);
100170
86455974b971 (decode_coding_charset): Check type of an element of
Kenichi Handa <handa@m17n.org>
parents: 100135
diff changeset
5165 if (! INTEGERP (val) && ! CONSP (val))
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5166 goto invalid_code;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5167 if (INTEGERP (val))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5168 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5169 charset = CHARSET_FROM_ID (XFASTINT (val));
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5170 dim = CHARSET_DIMENSION (charset);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5171 while (len < dim)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5172 {
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5173 ONE_MORE_BYTE (c);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5174 code = (code << 8) | c;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5175 len++;
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
5176 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5177 CODING_DECODE_CHAR (coding, src, src_base, src_end,
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5178 charset, code, c);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5179 }
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
5180 else
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5181 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5182 /* VAL is a list of charset IDs. It is assured that the
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5183 list is sorted by charset dimensions (smaller one
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5184 comes first). */
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5185 while (CONSP (val))
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5186 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5187 charset = CHARSET_FROM_ID (XFASTINT (XCAR (val)));
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
5188 dim = CHARSET_DIMENSION (charset);
88607
18436bf3d6dd (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88598
diff changeset
5189 while (len < dim)
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5190 {
88598
b88195f69856 (decode_coding_charset): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88597
diff changeset
5191 ONE_MORE_BYTE (c);
b88195f69856 (decode_coding_charset): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88597
diff changeset
5192 code = (code << 8) | c;
88607
18436bf3d6dd (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88598
diff changeset
5193 len++;
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5194 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5195 CODING_DECODE_CHAR (coding, src, src_base,
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5196 src_end, charset, code, c);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5197 if (c >= 0)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5198 break;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5199 val = XCDR (val);
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5200 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5201 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5202 if (c < 0)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5203 goto invalid_code;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5204 if (charset->id != charset_ascii
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5205 && last_id != charset->id)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5206 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5207 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5208 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5209 last_id = charset->id;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5210 last_offset = char_offset;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5211 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5212
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5213 *charbuf++ = c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5214 char_offset++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5215 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5216
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5217 invalid_code:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5218 src = src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5219 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5220 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5221 *charbuf++ = c < 0 ? -c : ASCII_BYTE_P (c) ? c : BYTE8_TO_CHAR (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5222 char_offset++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5223 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5224 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5225
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5226 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5227 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5228 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5229 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5230 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5231 coding->charbuf_used = charbuf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5232 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5233
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5234 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5235 encode_coding_charset (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5236 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5237 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5238 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5239 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5240 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5241 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5242 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5243 int safe_room = MAX_MULTIBYTE_LENGTH;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5244 int produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5245 Lisp_Object attrs, charset_list;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5246 int ascii_compatible;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5247 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5248
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5249 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5250 ascii_compatible = ! NILP (CODING_ATTR_ASCII_COMPAT (attrs));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5251
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5252 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5253 {
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5254 struct charset *charset;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5255 unsigned code;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5256
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5257 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5258 c = *charbuf++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5259 if (ascii_compatible && ASCII_CHAR_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5260 EMIT_ONE_ASCII_BYTE (c);
88690
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5261 else if (CHAR_BYTE8_P (c))
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5262 {
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5263 c = CHAR_TO_BYTE8 (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5264 EMIT_ONE_BYTE (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5265 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5266 else
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5267 {
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5268 charset = char_charset (c, charset_list, &code);
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5269 if (charset)
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5270 {
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5271 if (CHARSET_DIMENSION (charset) == 1)
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5272 EMIT_ONE_BYTE (code);
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5273 else if (CHARSET_DIMENSION (charset) == 2)
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5274 EMIT_TWO_BYTES (code >> 8, code & 0xFF);
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5275 else if (CHARSET_DIMENSION (charset) == 3)
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5276 EMIT_THREE_BYTES (code >> 16, (code >> 8) & 0xFF, code & 0xFF);
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5277 else
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5278 EMIT_FOUR_BYTES (code >> 24, (code >> 16) & 0xFF,
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5279 (code >> 8) & 0xFF, code & 0xFF);
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5280 }
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5281 else
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5282 {
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5283 if (coding->mode & CODING_MODE_SAFE_ENCODING)
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5284 c = CODING_INHIBIT_CHARACTER_SUBSTITUTION;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5285 else
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5286 c = coding->default_char;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5287 EMIT_ONE_BYTE (c);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5288 }
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5289 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5290 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5291
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5292 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5293 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5294 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5295 return 0;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5296 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5297
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5298
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5299 /*** 7. C library functions ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5300
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5301 /* Setup coding context CODING from information about CODING_SYSTEM.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5302 If CODING_SYSTEM is nil, `undecided' is assumed. If
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5303 CODING_SYSTEM is invalid, signal an error. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5304
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5305 void
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
5306 setup_coding_system (coding_system, coding)
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
5307 Lisp_Object coding_system;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5308 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5309 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5310 Lisp_Object attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5311 Lisp_Object eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5312 Lisp_Object coding_type;
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
5313 Lisp_Object val;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5314
24460
be35d27a4bfb (setup_coding_system): Check for CODING_SYSTEM = nil.
Kenichi Handa <handa@m17n.org>
parents: 24425
diff changeset
5315 if (NILP (coding_system))
90011
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
5316 coding_system = Qundecided;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5317
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5318 CHECK_CODING_SYSTEM_GET_ID (coding_system, coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5319
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5320 attrs = CODING_ID_ATTRS (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5321 eol_type = CODING_ID_EOL_TYPE (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5322
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5323 coding->mode = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5324 coding->head_ascii = -1;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5325 if (VECTORP (eol_type))
90587
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5326 coding->common_flags = (CODING_REQUIRE_DECODING_MASK
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5327 | CODING_REQUIRE_DETECTION_MASK);
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5328 else if (! EQ (eol_type, Qunix))
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5329 coding->common_flags = (CODING_REQUIRE_DECODING_MASK
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5330 | CODING_REQUIRE_ENCODING_MASK);
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5331 else
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5332 coding->common_flags = 0;
89448
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
5333 if (! NILP (CODING_ATTR_POST_READ (attrs)))
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
5334 coding->common_flags |= CODING_REQUIRE_DECODING_MASK;
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
5335 if (! NILP (CODING_ATTR_PRE_WRITE (attrs)))
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
5336 coding->common_flags |= CODING_REQUIRE_ENCODING_MASK;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5337 if (! NILP (CODING_ATTR_FOR_UNIBYTE (attrs)))
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5338 coding->common_flags |= CODING_FOR_UNIBYTE_MASK;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5339
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5340 val = CODING_ATTR_SAFE_CHARSETS (attrs);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5341 coding->max_charset_id = SCHARS (val) - 1;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5342 coding->safe_charsets = (char *) SDATA (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5343 coding->default_char = XINT (CODING_ATTR_DEFAULT_CHAR (attrs));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5344
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5345 coding_type = CODING_ATTR_TYPE (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5346 if (EQ (coding_type, Qundecided))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5347 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5348 coding->detector = NULL;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5349 coding->decoder = decode_coding_raw_text;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5350 coding->encoder = encode_coding_raw_text;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5351 coding->common_flags |= CODING_REQUIRE_DETECTION_MASK;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5352 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5353 else if (EQ (coding_type, Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5354 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5355 int i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5356 int flags = XINT (AREF (attrs, coding_attr_iso_flags));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5357
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5358 /* Invoke graphic register 0 to plane 0. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5359 CODING_ISO_INVOCATION (coding, 0) = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5360 /* Invoke graphic register 1 to plane 1 if we can use 8-bit. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5361 CODING_ISO_INVOCATION (coding, 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5362 = (flags & CODING_ISO_FLAG_SEVEN_BITS ? -1 : 1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5363 /* Setup the initial status of designation. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5364 for (i = 0; i < 4; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5365 CODING_ISO_DESIGNATION (coding, i) = CODING_ISO_INITIAL (coding, i);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5366 /* Not single shifting initially. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5367 CODING_ISO_SINGLE_SHIFTING (coding) = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5368 /* Beginning of buffer should also be regarded as bol. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5369 CODING_ISO_BOL (coding) = 1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5370 coding->detector = detect_coding_iso_2022;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5371 coding->decoder = decode_coding_iso_2022;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5372 coding->encoder = encode_coding_iso_2022;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5373 if (flags & CODING_ISO_FLAG_SAFE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5374 coding->mode |= CODING_MODE_SAFE_ENCODING;
20227
71008f909642 (setup_coding_system): Initialize common_flags member
Kenichi Handa <handa@m17n.org>
parents: 20150
diff changeset
5375 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5376 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5377 | CODING_REQUIRE_FLUSHING_MASK);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5378 if (flags & CODING_ISO_FLAG_COMPOSITION)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5379 coding->common_flags |= CODING_ANNOTATE_COMPOSITION_MASK;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5380 if (flags & CODING_ISO_FLAG_DESIGNATION)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5381 coding->common_flags |= CODING_ANNOTATE_CHARSET_MASK;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5382 if (flags & CODING_ISO_FLAG_FULL_SUPPORT)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5383 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5384 setup_iso_safe_charsets (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5385 val = CODING_ATTR_SAFE_CHARSETS (attrs);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5386 coding->max_charset_id = SCHARS (val) - 1;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5387 coding->safe_charsets = (char *) SDATA (val);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5388 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5389 CODING_ISO_FLAGS (coding) = flags;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5390 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5391 else if (EQ (coding_type, Qcharset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5392 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5393 coding->detector = detect_coding_charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5394 coding->decoder = decode_coding_charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5395 coding->encoder = encode_coding_charset;
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
5396 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5397 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5398 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5399 else if (EQ (coding_type, Qutf_8))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5400 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5401 val = AREF (attrs, coding_attr_utf_bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5402 CODING_UTF_8_BOM (coding) = (CONSP (val) ? utf_detect_bom
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5403 : EQ (val, Qt) ? utf_with_bom
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5404 : utf_without_bom);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5405 coding->detector = detect_coding_utf_8;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5406 coding->decoder = decode_coding_utf_8;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5407 coding->encoder = encode_coding_utf_8;
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
5408 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5409 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5410 if (CODING_UTF_8_BOM (coding) == utf_detect_bom)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5411 coding->common_flags |= CODING_REQUIRE_DETECTION_MASK;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5412 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5413 else if (EQ (coding_type, Qutf_16))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5414 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5415 val = AREF (attrs, coding_attr_utf_bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5416 CODING_UTF_16_BOM (coding) = (CONSP (val) ? utf_detect_bom
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5417 : EQ (val, Qt) ? utf_with_bom
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5418 : utf_without_bom);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5419 val = AREF (attrs, coding_attr_utf_16_endian);
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
5420 CODING_UTF_16_ENDIAN (coding) = (EQ (val, Qbig) ? utf_16_big_endian
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5421 : utf_16_little_endian);
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
5422 CODING_UTF_16_SURROGATE (coding) = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5423 coding->detector = detect_coding_utf_16;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5424 coding->decoder = decode_coding_utf_16;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5425 coding->encoder = encode_coding_utf_16;
20227
71008f909642 (setup_coding_system): Initialize common_flags member
Kenichi Handa <handa@m17n.org>
parents: 20150
diff changeset
5426 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5427 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5428 if (CODING_UTF_16_BOM (coding) == utf_detect_bom)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
5429 coding->common_flags |= CODING_REQUIRE_DETECTION_MASK;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5430 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5431 else if (EQ (coding_type, Qccl))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5432 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5433 coding->detector = detect_coding_ccl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5434 coding->decoder = decode_coding_ccl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5435 coding->encoder = encode_coding_ccl;
20227
71008f909642 (setup_coding_system): Initialize common_flags member
Kenichi Handa <handa@m17n.org>
parents: 20150
diff changeset
5436 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5437 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5438 | CODING_REQUIRE_FLUSHING_MASK);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5439 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5440 else if (EQ (coding_type, Qemacs_mule))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5441 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5442 coding->detector = detect_coding_emacs_mule;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5443 coding->decoder = decode_coding_emacs_mule;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5444 coding->encoder = encode_coding_emacs_mule;
20227
71008f909642 (setup_coding_system): Initialize common_flags member
Kenichi Handa <handa@m17n.org>
parents: 20150
diff changeset
5445 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5446 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5447 if (! NILP (AREF (attrs, coding_attr_emacs_mule_full))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5448 && ! EQ (CODING_ATTR_CHARSET_LIST (attrs), Vemacs_mule_charset_list))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5449 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5450 Lisp_Object tail, safe_charsets;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5451 int max_charset_id = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5452
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5453 for (tail = Vemacs_mule_charset_list; CONSP (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5454 tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5455 if (max_charset_id < XFASTINT (XCAR (tail)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5456 max_charset_id = XFASTINT (XCAR (tail));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5457 safe_charsets = Fmake_string (make_number (max_charset_id + 1),
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5458 make_number (255));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5459 for (tail = Vemacs_mule_charset_list; CONSP (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5460 tail = XCDR (tail))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5461 SSET (safe_charsets, XFASTINT (XCAR (tail)), 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5462 coding->max_charset_id = max_charset_id;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5463 coding->safe_charsets = (char *) SDATA (safe_charsets);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5464 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5465 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5466 else if (EQ (coding_type, Qshift_jis))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5467 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5468 coding->detector = detect_coding_sjis;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5469 coding->decoder = decode_coding_sjis;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5470 coding->encoder = encode_coding_sjis;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5471 coding->common_flags
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5472 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5473 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5474 else if (EQ (coding_type, Qbig5))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5475 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5476 coding->detector = detect_coding_big5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5477 coding->decoder = decode_coding_big5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5478 coding->encoder = encode_coding_big5;
20227
71008f909642 (setup_coding_system): Initialize common_flags member
Kenichi Handa <handa@m17n.org>
parents: 20150
diff changeset
5479 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5480 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5481 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5482 else /* EQ (coding_type, Qraw_text) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5483 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5484 coding->detector = NULL;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5485 coding->decoder = decode_coding_raw_text;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5486 coding->encoder = encode_coding_raw_text;
89933
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5487 if (! EQ (eol_type, Qunix))
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5488 {
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5489 coding->common_flags |= CODING_REQUIRE_DECODING_MASK;
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5490 if (! VECTORP (eol_type))
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5491 coding->common_flags |= CODING_REQUIRE_ENCODING_MASK;
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5492 }
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5493
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5494 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5495
22616
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
5496 return;
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
5497 }
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
5498
90061
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5499 /* Return a list of charsets supported by CODING. */
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5500
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5501 Lisp_Object
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5502 coding_charset_list (coding)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
5503 struct coding_system *coding;
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
5504 {
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
5505 Lisp_Object attrs, charset_list;
90061
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5506
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5507 CODING_GET_INFO (coding, attrs, charset_list);
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5508 if (EQ (CODING_ATTR_TYPE (attrs), Qiso_2022))
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5509 {
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5510 int flags = XINT (AREF (attrs, coding_attr_iso_flags));
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5511
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5512 if (flags & CODING_ISO_FLAG_FULL_SUPPORT)
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5513 charset_list = Viso_2022_charset_list;
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5514 }
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5515 else if (EQ (CODING_ATTR_TYPE (attrs), Qemacs_mule))
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5516 {
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5517 charset_list = Vemacs_mule_charset_list;
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5518 }
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5519 return charset_list;
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5520 }
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5521
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5522
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5523 /* Return raw-text or one of its subsidiaries that has the same
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5524 eol_type as CODING_SYSTEM. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5525
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5526 Lisp_Object
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5527 raw_text_coding_system (coding_system)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5528 Lisp_Object coding_system;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
5529 {
88430
6418a272b97e * coding.c: Delete unused variables.
Kenichi Handa <handa@m17n.org>
parents: 88365
diff changeset
5530 Lisp_Object spec, attrs;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5531 Lisp_Object eol_type, raw_text_eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5532
89462
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
5533 if (NILP (coding_system))
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
5534 return Qraw_text;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5535 spec = CODING_SYSTEM_SPEC (coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5536 attrs = AREF (spec, 0);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5537
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5538 if (EQ (CODING_ATTR_TYPE (attrs), Qraw_text))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5539 return coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5540
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5541 eol_type = AREF (spec, 2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5542 if (VECTORP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5543 return Qraw_text;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5544 spec = CODING_SYSTEM_SPEC (Qraw_text);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5545 raw_text_eol_type = AREF (spec, 2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5546 return (EQ (eol_type, Qunix) ? AREF (raw_text_eol_type, 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5547 : EQ (eol_type, Qdos) ? AREF (raw_text_eol_type, 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5548 : AREF (raw_text_eol_type, 2));
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
5549 }
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
5550
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5551
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5552 /* If CODING_SYSTEM doesn't specify end-of-line format but PARENT
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5553 does, return the subsidiary of CODING_SYSTEM that has the same eol-spec as
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
5554 PARENT. Otherwise, return CODING_SYSTEM. If PARENT is nil,
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
5555 inherit end-of-line format from the system's setting
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
5556 (system_eol_type). */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5557
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5558 Lisp_Object
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5559 coding_inherit_eol_type (coding_system, parent)
88473
b47ee8b1ce03 (coding_inherit_eol_type)
Dave Love <fx@gnu.org>
parents: 88465
diff changeset
5560 Lisp_Object coding_system, parent;
22616
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
5561 {
89545
4f394eed6ff2 (inhibit_pre_post_conversion): Removed (unused).
Dave Love <fx@gnu.org>
parents: 89519
diff changeset
5562 Lisp_Object spec, eol_type;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5563
89462
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
5564 if (NILP (coding_system))
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
5565 coding_system = Qraw_text;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5566 spec = CODING_SYSTEM_SPEC (coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5567 eol_type = AREF (spec, 2);
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
5568 if (VECTORP (eol_type))
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
5569 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5570 Lisp_Object parent_eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5571
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
5572 if (! NILP (parent))
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
5573 {
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
5574 Lisp_Object parent_spec;
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
5575
90587
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5576 parent_spec = CODING_SYSTEM_SPEC (parent);
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
5577 parent_eol_type = AREF (parent_spec, 2);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5578 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5579 else
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
5580 parent_eol_type = system_eol_type;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5581 if (EQ (parent_eol_type, Qunix))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5582 coding_system = AREF (eol_type, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5583 else if (EQ (parent_eol_type, Qdos))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5584 coding_system = AREF (eol_type, 1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5585 else if (EQ (parent_eol_type, Qmac))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5586 coding_system = AREF (eol_type, 2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5587 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5588 return coding_system;
22616
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
5589 }
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
5590
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5591 /* Emacs has a mechanism to automatically detect a coding system if it
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5592 is one of Emacs' internal format, ISO2022, SJIS, and BIG5. But,
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5593 it's impossible to distinguish some coding systems accurately
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5594 because they use the same range of codes. So, at first, coding
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5595 systems are categorized into the following categories:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5596
17835
f36ffb6f1208 Name change through the code:
Kenichi Handa <handa@m17n.org>
parents: 17725
diff changeset
5597 o coding-category-emacs-mule
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5598
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5599 The category for a coding system which has the same code range
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5600 as Emacs' internal format. Assigned the coding-system (Lisp
17835
f36ffb6f1208 Name change through the code:
Kenichi Handa <handa@m17n.org>
parents: 17725
diff changeset
5601 symbol) `emacs-mule' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5602
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5603 o coding-category-sjis
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5604
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5605 The category for a coding system which has the same code range
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5606 as SJIS. Assigned the coding-system (Lisp
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5607 symbol) `japanese-shift-jis' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5608
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5609 o coding-category-iso-7
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5610
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5611 The category for a coding system which has the same code range
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5612 as ISO2022 of 7-bit environment. This doesn't use any locking
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5613 shift and single shift functions. This can encode/decode all
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5614 charsets. Assigned the coding-system (Lisp symbol)
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5615 `iso-2022-7bit' by default.
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5616
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5617 o coding-category-iso-7-tight
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5618
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5619 Same as coding-category-iso-7 except that this can
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5620 encode/decode only the specified charsets.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5621
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5622 o coding-category-iso-8-1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5623
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5624 The category for a coding system which has the same code range
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5625 as ISO2022 of 8-bit environment and graphic plane 1 used only
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5626 for DIMENSION1 charset. This doesn't use any locking shift
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5627 and single shift functions. Assigned the coding-system (Lisp
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5628 symbol) `iso-latin-1' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5629
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5630 o coding-category-iso-8-2
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5631
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5632 The category for a coding system which has the same code range
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5633 as ISO2022 of 8-bit environment and graphic plane 1 used only
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5634 for DIMENSION2 charset. This doesn't use any locking shift
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5635 and single shift functions. Assigned the coding-system (Lisp
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5636 symbol) `japanese-iso-8bit' by default.
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5637
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5638 o coding-category-iso-7-else
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5639
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5640 The category for a coding system which has the same code range
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5641 as ISO2022 of 7-bit environment but uses locking shift or
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5642 single shift functions. Assigned the coding-system (Lisp
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5643 symbol) `iso-2022-7bit-lock' by default.
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5644
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5645 o coding-category-iso-8-else
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5646
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5647 The category for a coding system which has the same code range
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5648 as ISO2022 of 8-bit environment but uses locking shift or
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5649 single shift functions. Assigned the coding-system (Lisp
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
5650 symbol) `iso-2022-8bit-ss2' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5651
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5652 o coding-category-big5
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5653
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5654 The category for a coding system which has the same code range
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5655 as BIG5. Assigned the coding-system (Lisp symbol)
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
5656 `cn-big5' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5657
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5658 o coding-category-utf-8
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5659
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5660 The category for a coding system which has the same code range
54303
5256a4b9366f UTF-8 is now RFC3629.
Eli Zaretskii <eliz@gnu.org>
parents: 53775
diff changeset
5661 as UTF-8 (cf. RFC3629). Assigned the coding-system (Lisp
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5662 symbol) `utf-8' by default.
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5663
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5664 o coding-category-utf-16-be
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5665
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5666 The category for a coding system in which a text has an
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5667 Unicode signature (cf. Unicode Standard) in the order of BIG
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5668 endian at the head. Assigned the coding-system (Lisp symbol)
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5669 `utf-16-be' by default.
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5670
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5671 o coding-category-utf-16-le
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5672
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5673 The category for a coding system in which a text has an
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5674 Unicode signature (cf. Unicode Standard) in the order of
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5675 LITTLE endian at the head. Assigned the coding-system (Lisp
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5676 symbol) `utf-16-le' by default.
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5677
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5678 o coding-category-ccl
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5679
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5680 The category for a coding system of which encoder/decoder is
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5681 written in CCL programs. The default value is nil, i.e., no
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5682 coding system is assigned.
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5683
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5684 o coding-category-binary
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5685
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5686 The category for a coding system not categorized in any of the
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5687 above. Assigned the coding-system (Lisp symbol)
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
5688 `no-conversion' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5689
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5690 Each of them is a Lisp symbol and the value is an actual
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5691 `coding-system' (this is also a Lisp symbol) assigned by a user.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5692 What Emacs does actually is to detect a category of coding system.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5693 Then, it uses a `coding-system' assigned to it. If Emacs can't
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5694 decide on a single category, it selects the category of the
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5695 highest priority. Priorities of categories are also specified by a
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5696 user in a Lisp variable `coding-category-list'.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5697
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5698 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5699
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5700 #define EOL_SEEN_NONE 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5701 #define EOL_SEEN_LF 1
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5702 #define EOL_SEEN_CR 2
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5703 #define EOL_SEEN_CRLF 4
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5704
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5705 /* Detect how end-of-line of a text of length SRC_BYTES pointed to by
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5706 SOURCE is encoded. If CATEGORY is one of
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5707 coding_category_utf_16_XXXX, assume that CR and LF are encoded by
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5708 two bytes; otherwise they are encoded by one byte.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5709
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5710 Return one of EOL_SEEN_XXX. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5711
19173
04ed7c3f5cee (detect_eol_type): If EOL representation does not
Richard M. Stallman <rms@gnu.org>
parents: 19134
diff changeset
5712 #define MAX_EOL_CHECK_COUNT 3
04ed7c3f5cee (detect_eol_type): If EOL representation does not
Richard M. Stallman <rms@gnu.org>
parents: 19134
diff changeset
5713
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5714 static int
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
5715 detect_eol (source, src_bytes, category)
84646
922a7e3b7383 (detect_eol_type, detect_eol_type_in_2_octet_form):
Michaël Cadilhac <michael.cadilhac@lrde.org>
parents: 83648
diff changeset
5716 const unsigned char *source;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5717 EMACS_INT src_bytes;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
5718 enum coding_category category;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5719 {
84646
922a7e3b7383 (detect_eol_type, detect_eol_type_in_2_octet_form):
Michaël Cadilhac <michael.cadilhac@lrde.org>
parents: 83648
diff changeset
5720 const unsigned char *src = source, *src_end = src + src_bytes;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5721 unsigned char c;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5722 int total = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5723 int eol_seen = EOL_SEEN_NONE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5724
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
5725 if ((1 << category) & CATEGORY_MASK_UTF_16)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5726 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5727 int msb, lsb;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5728
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
5729 msb = category == (coding_category_utf_16_le
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
5730 | coding_category_utf_16_le_nosig);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5731 lsb = 1 - msb;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5732
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5733 while (src + 1 < src_end)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5734 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5735 c = src[lsb];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5736 if (src[msb] == 0 && (c == '\n' || c == '\r'))
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5737 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5738 int this_eol;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5739
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5740 if (c == '\n')
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5741 this_eol = EOL_SEEN_LF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5742 else if (src + 3 >= src_end
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5743 || src[msb + 2] != 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5744 || src[lsb + 2] != '\n')
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5745 this_eol = EOL_SEEN_CR;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5746 else
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5747 this_eol = EOL_SEEN_CRLF;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5748
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5749 if (eol_seen == EOL_SEEN_NONE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5750 /* This is the first end-of-line. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5751 eol_seen = this_eol;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5752 else if (eol_seen != this_eol)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5753 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5754 /* The found type is different from what found before. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5755 eol_seen = EOL_SEEN_LF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5756 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5757 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5758 if (++total == MAX_EOL_CHECK_COUNT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5759 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5760 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5761 src += 2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5762 }
30833
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
5763 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5764 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5765 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5766 while (src < src_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5767 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5768 c = *src++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5769 if (c == '\n' || c == '\r')
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5770 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5771 int this_eol;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5772
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5773 if (c == '\n')
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5774 this_eol = EOL_SEEN_LF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5775 else if (src >= src_end || *src != '\n')
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5776 this_eol = EOL_SEEN_CR;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5777 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5778 this_eol = EOL_SEEN_CRLF, src++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5779
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5780 if (eol_seen == EOL_SEEN_NONE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5781 /* This is the first end-of-line. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5782 eol_seen = this_eol;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5783 else if (eol_seen != this_eol)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5784 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5785 /* The found type is different from what was found before. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5786 eol_seen = EOL_SEEN_LF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5787 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5788 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5789 if (++total == MAX_EOL_CHECK_COUNT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5790 break;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5791 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5792 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5793 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5794 return eol_seen;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5795 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5796
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5797
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5798 static Lisp_Object
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5799 adjust_coding_eol_type (coding, eol_seen)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5800 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5801 int eol_seen;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5802 {
88430
6418a272b97e * coding.c: Delete unused variables.
Kenichi Handa <handa@m17n.org>
parents: 88365
diff changeset
5803 Lisp_Object eol_type;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5804
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5805 eol_type = CODING_ID_EOL_TYPE (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5806 if (eol_seen & EOL_SEEN_LF)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5807 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5808 coding->id = CODING_SYSTEM_ID (AREF (eol_type, 0));
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5809 eol_type = Qunix;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5810 }
88862
108e2535280d (adjust_coding_eol_type): Fix eol_type/eol_seen mixup.
Dave Love <fx@gnu.org>
parents: 88856
diff changeset
5811 else if (eol_seen & EOL_SEEN_CRLF)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5812 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5813 coding->id = CODING_SYSTEM_ID (AREF (eol_type, 1));
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5814 eol_type = Qdos;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5815 }
88862
108e2535280d (adjust_coding_eol_type): Fix eol_type/eol_seen mixup.
Dave Love <fx@gnu.org>
parents: 88856
diff changeset
5816 else if (eol_seen & EOL_SEEN_CR)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5817 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5818 coding->id = CODING_SYSTEM_ID (AREF (eol_type, 2));
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5819 eol_type = Qmac;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5820 }
19181
917138730635 (detect_eol_type): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 19173
diff changeset
5821 return eol_type;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5822 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5823
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5824 /* Detect how a text specified in CODING is encoded. If a coding
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5825 system is detected, update fields of CODING by the detected coding
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5826 system. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5827
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5828 void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5829 detect_coding (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5830 struct coding_system *coding;
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5831 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5832 const unsigned char *src, *src_end;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5833
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5834 coding->consumed = coding->consumed_char = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5835 coding->produced = coding->produced_char = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5836 coding_set_source (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5837
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5838 src_end = coding->source + coding->src_bytes;
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5839 coding->head_ascii = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5840
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5841 /* If we have not yet decided the text encoding type, detect it
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5842 now. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5843 if (EQ (CODING_ATTR_TYPE (CODING_ID_ATTRS (coding->id)), Qundecided))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5844 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5845 int c, i;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5846 struct coding_detection_info detect_info;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5847 int null_byte_found = 0, eight_bit_found = 0;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5848
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5849 detect_info.checked = detect_info.found = detect_info.rejected = 0;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5850 for (src = coding->source; src < src_end; src++)
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
5851 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5852 c = *src;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5853 if (c & 0x80)
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5854 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5855 eight_bit_found = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5856 if (null_byte_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5857 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5858 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5859 else if (c < 0x20)
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
5860 {
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5861 if ((c == ISO_CODE_ESC || c == ISO_CODE_SI || c == ISO_CODE_SO)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5862 && ! inhibit_iso_escape_detection
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5863 && ! detect_info.checked)
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
5864 {
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5865 if (detect_coding_iso_2022 (coding, &detect_info))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5866 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5867 /* We have scanned the whole data. */
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5868 if (! (detect_info.rejected & CATEGORY_MASK_ISO_7_ELSE))
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5869 {
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5870 /* We didn't find an 8-bit code. We may
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5871 have found a null-byte, but it's very
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5872 rare that a binary file conforms to
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5873 ISO-2022. */
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5874 src = src_end;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5875 coding->head_ascii = src - coding->source;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5876 }
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5877 detect_info.rejected |= ~CATEGORY_MASK_ISO_ESCAPE;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5878 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5879 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5880 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5881 else if (! c)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5882 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5883 null_byte_found = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5884 if (eight_bit_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5885 break;
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
5886 }
95585
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
5887 if (! eight_bit_found)
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
5888 coding->head_ascii++;
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
5889 }
95585
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
5890 else if (! eight_bit_found)
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5891 coding->head_ascii++;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5892 }
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5893
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5894 if (null_byte_found || eight_bit_found
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5895 || coding->head_ascii < coding->src_bytes
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5896 || detect_info.found)
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5897 {
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5898 enum coding_category category;
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5899 struct coding_system *this;
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5900
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5901 if (coding->head_ascii == coding->src_bytes)
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5902 /* As all bytes are 7-bit, we can ignore non-ISO-2022 codings. */
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5903 for (i = 0; i < coding_category_raw_text; i++)
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5904 {
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5905 category = coding_priorities[i];
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5906 this = coding_categories + category;
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5907 if (detect_info.found & (1 << category))
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5908 break;
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5909 }
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5910 else
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5911 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5912 if (null_byte_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5913 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5914 detect_info.checked |= ~CATEGORY_MASK_UTF_16;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5915 detect_info.rejected |= ~CATEGORY_MASK_UTF_16;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5916 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5917 for (i = 0; i < coding_category_raw_text; i++)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5918 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5919 category = coding_priorities[i];
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5920 this = coding_categories + category;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5921 if (this->id < 0)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5922 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5923 /* No coding system of this category is defined. */
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5924 detect_info.rejected |= (1 << category);
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5925 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5926 else if (category >= coding_category_raw_text)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5927 continue;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5928 else if (detect_info.checked & (1 << category))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5929 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5930 if (detect_info.found & (1 << category))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5931 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5932 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5933 else if ((*(this->detector)) (coding, &detect_info)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5934 && detect_info.found & (1 << category))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5935 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5936 if (category == coding_category_utf_16_auto)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5937 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5938 if (detect_info.found & CATEGORY_MASK_UTF_16_LE)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5939 category = coding_category_utf_16_le;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5940 else
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5941 category = coding_category_utf_16_be;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5942 }
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
5943 break;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5944 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5945 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
5946 }
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5947
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5948 if (i < coding_category_raw_text)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5949 setup_coding_system (CODING_ID_NAME (this->id), coding);
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5950 else if (null_byte_found)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5951 setup_coding_system (Qno_conversion, coding);
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5952 else if ((detect_info.rejected & CATEGORY_MASK_ANY)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5953 == CATEGORY_MASK_ANY)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5954 setup_coding_system (Qraw_text, coding);
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5955 else if (detect_info.rejected)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5956 for (i = 0; i < coding_category_raw_text; i++)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5957 if (! (detect_info.rejected & (1 << coding_priorities[i])))
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5958 {
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5959 this = coding_categories + coding_priorities[i];
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5960 setup_coding_system (CODING_ID_NAME (this->id), coding);
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5961 break;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
5962 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5963 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5964 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5965 else if (XINT (CODING_ATTR_CATEGORY (CODING_ID_ATTRS (coding->id)))
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5966 == coding_category_utf_8_auto)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5967 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5968 Lisp_Object coding_systems;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5969 struct coding_detection_info detect_info;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5970
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5971 coding_systems
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5972 = AREF (CODING_ID_ATTRS (coding->id), coding_attr_utf_bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5973 detect_info.found = detect_info.rejected = 0;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5974 coding->head_ascii = 0;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5975 if (CONSP (coding_systems)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5976 && detect_coding_utf_8 (coding, &detect_info))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5977 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5978 if (detect_info.found & CATEGORY_MASK_UTF_8_SIG)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5979 setup_coding_system (XCAR (coding_systems), coding);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5980 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5981 setup_coding_system (XCDR (coding_systems), coding);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5982 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5983 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5984 else if (XINT (CODING_ATTR_CATEGORY (CODING_ID_ATTRS (coding->id)))
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5985 == coding_category_utf_16_auto)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
5986 {
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
5987 Lisp_Object coding_systems;
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
5988 struct coding_detection_info detect_info;
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
5989
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
5990 coding_systems
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5991 = AREF (CODING_ID_ATTRS (coding->id), coding_attr_utf_bom);
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
5992 detect_info.found = detect_info.rejected = 0;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5993 coding->head_ascii = 0;
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
5994 if (CONSP (coding_systems)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5995 && detect_coding_utf_16 (coding, &detect_info))
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
5996 {
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
5997 if (detect_info.found & CATEGORY_MASK_UTF_16_LE)
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
5998 setup_coding_system (XCAR (coding_systems), coding);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5999 else if (detect_info.found & CATEGORY_MASK_UTF_16_BE)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6000 setup_coding_system (XCDR (coding_systems), coding);
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6001 }
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6002 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6003 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6004
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6005
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6006 static void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6007 decode_eol (coding)
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6008 struct coding_system *coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6009 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6010 Lisp_Object eol_type;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6011 unsigned char *p, *pbeg, *pend;
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
6012
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6013 eol_type = CODING_ID_EOL_TYPE (coding->id);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6014 if (EQ (eol_type, Qunix))
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6015 return;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6016
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6017 if (NILP (coding->dst_object))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6018 pbeg = coding->destination;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6019 else
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6020 pbeg = BYTE_POS_ADDR (coding->dst_pos_byte);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6021 pend = pbeg + coding->produced;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6022
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6023 if (VECTORP (eol_type))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6024 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6025 int eol_seen = EOL_SEEN_NONE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6026
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6027 for (p = pbeg; p < pend; p++)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6028 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6029 if (*p == '\n')
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6030 eol_seen |= EOL_SEEN_LF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6031 else if (*p == '\r')
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6032 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6033 if (p + 1 < pend && *(p + 1) == '\n')
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6034 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6035 eol_seen |= EOL_SEEN_CRLF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6036 p++;
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6037 }
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6038 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6039 eol_seen |= EOL_SEEN_CR;
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6040 }
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6041 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6042 if (eol_seen != EOL_SEEN_NONE
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6043 && eol_seen != EOL_SEEN_LF
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6044 && eol_seen != EOL_SEEN_CRLF
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6045 && eol_seen != EOL_SEEN_CR)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6046 eol_seen = EOL_SEEN_LF;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6047 if (eol_seen != EOL_SEEN_NONE)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6048 eol_type = adjust_coding_eol_type (coding, eol_seen);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6049 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6050
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6051 if (EQ (eol_type, Qmac))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6052 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6053 for (p = pbeg; p < pend; p++)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6054 if (*p == '\r')
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6055 *p = '\n';
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6056 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6057 else if (EQ (eol_type, Qdos))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6058 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6059 int n = 0;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6060
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6061 if (NILP (coding->dst_object))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6062 {
90378
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6063 /* Start deleting '\r' from the tail to minimize the memory
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6064 movement. */
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6065 for (p = pend - 2; p >= pbeg; p--)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6066 if (*p == '\r')
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6067 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6068 safe_bcopy ((char *) (p + 1), (char *) p, pend-- - p - 1);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6069 n++;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6070 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6071 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6072 else
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6073 {
90378
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6074 int pos_byte = coding->dst_pos_byte;
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6075 int pos = coding->dst_pos;
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6076 int pos_end = pos + coding->produced_char - 1;
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6077
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6078 while (pos < pos_end)
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6079 {
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6080 p = BYTE_POS_ADDR (pos_byte);
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6081 if (*p == '\r' && p[1] == '\n')
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6082 {
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6083 del_range_2 (pos, pos_byte, pos + 1, pos_byte + 1, 0);
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6084 n++;
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6085 pos_end--;
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6086 }
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6087 pos++;
91535
419a669bc4f2 (decode_eol): Pay attention to coding->dst_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 91367
diff changeset
6088 if (coding->dst_multibyte)
419a669bc4f2 (decode_eol): Pay attention to coding->dst_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 91367
diff changeset
6089 pos_byte += BYTES_BY_CHAR_HEAD (*p);
419a669bc4f2 (decode_eol): Pay attention to coding->dst_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 91367
diff changeset
6090 else
419a669bc4f2 (decode_eol): Pay attention to coding->dst_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 91367
diff changeset
6091 pos_byte++;
90378
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6092 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6093 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6094 coding->produced -= n;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6095 coding->produced_char -= n;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6096 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6097 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6098
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6099
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
6100 /* Return a translation table (or list of them) from coding system
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
6101 attribute vector ATTRS for encoding (ENCODEP is nonzero) or
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
6102 decoding (ENCODEP is zero). */
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6103
89858
23cb9ed79225 (get_translation_table): Declare it as Lisp_Object.
Kenichi Handa <handa@m17n.org>
parents: 89856
diff changeset
6104 static Lisp_Object
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6105 get_translation_table (attrs, encodep, max_lookup)
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6106 Lisp_Object attrs;
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6107 int encodep, *max_lookup;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6108 {
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6109 Lisp_Object standard, translation_table;
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6110 Lisp_Object val;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6111
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6112 if (encodep)
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6113 translation_table = CODING_ATTR_ENCODE_TBL (attrs),
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6114 standard = Vstandard_translation_table_for_encode;
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6115 else
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6116 translation_table = CODING_ATTR_DECODE_TBL (attrs),
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6117 standard = Vstandard_translation_table_for_decode;
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
6118 if (NILP (translation_table))
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6119 translation_table = standard;
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6120 else
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6121 {
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6122 if (SYMBOLP (translation_table))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6123 translation_table = Fget (translation_table, Qtranslation_table);
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6124 else if (CONSP (translation_table))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6125 {
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6126 translation_table = Fcopy_sequence (translation_table);
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6127 for (val = translation_table; CONSP (val); val = XCDR (val))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6128 if (SYMBOLP (XCAR (val)))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6129 XSETCAR (val, Fget (XCAR (val), Qtranslation_table));
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6130 }
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6131 if (CHAR_TABLE_P (standard))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6132 {
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6133 if (CONSP (translation_table))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6134 translation_table = nconc2 (translation_table,
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6135 Fcons (standard, Qnil));
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6136 else
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6137 translation_table = Fcons (translation_table,
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6138 Fcons (standard, Qnil));
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6139 }
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6140 }
89861
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6141
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6142 if (max_lookup)
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6143 {
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6144 *max_lookup = 1;
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6145 if (CHAR_TABLE_P (translation_table)
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6146 && CHAR_TABLE_EXTRA_SLOTS (XCHAR_TABLE (translation_table)) > 1)
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6147 {
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6148 val = XCHAR_TABLE (translation_table)->extras[1];
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6149 if (NATNUMP (val) && *max_lookup < XFASTINT (val))
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6150 *max_lookup = XFASTINT (val);
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6151 }
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6152 else if (CONSP (translation_table))
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6153 {
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6154 Lisp_Object tail, val;
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6155
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6156 for (tail = translation_table; CONSP (tail); tail = XCDR (tail))
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6157 if (CHAR_TABLE_P (XCAR (tail))
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6158 && CHAR_TABLE_EXTRA_SLOTS (XCHAR_TABLE (XCAR (tail))) > 1)
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6159 {
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6160 val = XCHAR_TABLE (XCAR (tail))->extras[1];
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6161 if (NATNUMP (val) && *max_lookup < XFASTINT (val))
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6162 *max_lookup = XFASTINT (val);
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6163 }
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6164 }
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
6165 }
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6166 return translation_table;
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6167 }
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6168
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
/* Look up character C in TABLE, which is a char-table or a list whose
   char-table elements are consulted in order.  C and TRANS must be
   modifiable lvalues; TABLE, C and TRANS are evaluated more than
   once, so they must be free of side effects.

   When a lookup yields a character, C is replaced by that character
   and TRANS is set to Qnil; in a list, the following tables are then
   consulted with the new C.  When a lookup yields any other non-nil
   value, TRANS is left holding that value (and, in a list, the search
   stops there).  Otherwise TRANS ends up as Qnil.

   The loop variable has a name reserved for this macro so that it
   cannot capture an argument spelled `tail' at the call site.  */
#define LOOKUP_TRANSLATION_TABLE(table, c, trans)                       \
  do {                                                                  \
    (trans) = Qnil;                                                     \
    if (CHAR_TABLE_P (table))                                           \
      {                                                                 \
        (trans) = CHAR_TABLE_REF ((table), (c));                        \
        if (CHARACTERP (trans))                                         \
          (c) = XFASTINT (trans), (trans) = Qnil;                       \
      }                                                                 \
    else if (CONSP (table))                                             \
      {                                                                 \
        Lisp_Object lookup_tail_;                                       \
                                                                        \
        for (lookup_tail_ = (table); CONSP (lookup_tail_);              \
             lookup_tail_ = XCDR (lookup_tail_))                        \
          if (CHAR_TABLE_P (XCAR (lookup_tail_)))                       \
            {                                                           \
              (trans) = CHAR_TABLE_REF (XCAR (lookup_tail_), (c));      \
              if (CHARACTERP (trans))                                   \
                (c) = XFASTINT (trans), (trans) = Qnil;                 \
              else if (! NILP (trans))                                  \
                break;                                                  \
            }                                                           \
      }                                                                 \
  } while (0)
23cb9ed79225 (get_translation_table): Declare it as Lisp_Object.
Kenichi Handa <handa@m17n.org>
parents: 89856
diff changeset
6193
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6194
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6195 static Lisp_Object
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6196 get_translation (val, buf, buf_end, last_block, from_nchars, to_nchars)
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6197 Lisp_Object val;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6198 int *buf, *buf_end;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6199 int last_block;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6200 int *from_nchars, *to_nchars;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6201 {
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6202 /* VAL is TO or (([FROM-CHAR ...] . TO) ...) where TO is TO-CHAR or
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6203 [TO-CHAR ...]. */
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6204 if (CONSP (val))
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6205 {
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6206 Lisp_Object from, tail;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6207 int i, len;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6208
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6209 for (tail = val; CONSP (tail); tail = XCDR (tail))
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6210 {
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6211 val = XCAR (tail);
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6212 from = XCAR (val);
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6213 len = ASIZE (from);
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6214 for (i = 0; i < len; i++)
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6215 {
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6216 if (buf + i == buf_end)
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6217 {
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6218 if (! last_block)
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6219 return Qt;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6220 break;
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6221 }
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6222 if (XINT (AREF (from, i)) != buf[i])
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6223 break;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6224 }
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6225 if (i == len)
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6226 {
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6227 val = XCDR (val);
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6228 *from_nchars = len;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6229 break;
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6230 }
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6231 }
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6232 if (! CONSP (tail))
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6233 return Qnil;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6234 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6235 if (VECTORP (val))
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6236 *buf = XINT (AREF (val, 0)), *to_nchars = ASIZE (val);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6237 else
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6238 *buf = XINT (val);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6239 return val;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6240 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6241
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6242
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6243 static int
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6244 produce_chars (coding, translation_table, last_block)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6245 struct coding_system *coding;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6246 Lisp_Object translation_table;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6247 int last_block;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6248 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6249 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6250 unsigned char *dst_end = coding->destination + coding->dst_bytes;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6251 EMACS_INT produced;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6252 EMACS_INT produced_chars = 0;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6253 int carryover = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6254
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6255 if (! coding->chars_at_source)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6256 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6257 /* Source characters are in coding->charbuf. */
89575
59d10ebd2a0b (produce_chars): Revert last change.
Andreas Schwab <schwab@suse.de>
parents: 89571
diff changeset
6258 int *buf = coding->charbuf;
59d10ebd2a0b (produce_chars): Revert last change.
Andreas Schwab <schwab@suse.de>
parents: 89571
diff changeset
6259 int *buf_end = buf + coding->charbuf_used;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6260
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6261 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6262 {
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6263 coding_set_source (coding);
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6264 dst_end = ((unsigned char *) coding->source) + coding->consumed;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6265 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6266
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6267 while (buf < buf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6268 {
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6269 int c = *buf, i;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6270
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6271 if (c >= 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6272 {
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6273 int from_nchars = 1, to_nchars = 1;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6274 Lisp_Object trans = Qnil;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6275
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6276 LOOKUP_TRANSLATION_TABLE (translation_table, c, trans);
89858
23cb9ed79225 (get_translation_table): Declare it as Lisp_Object.
Kenichi Handa <handa@m17n.org>
parents: 89856
diff changeset
6277 if (! NILP (trans))
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6278 {
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6279 trans = get_translation (trans, buf, buf_end, last_block,
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6280 &from_nchars, &to_nchars);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6281 if (EQ (trans, Qt))
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6282 break;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6283 c = *buf;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6284 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6285
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6286 if (dst + MAX_MULTIBYTE_LENGTH * to_nchars > dst_end)
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6287 {
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6288 dst = alloc_destination (coding,
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6289 buf_end - buf
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6290 + MAX_MULTIBYTE_LENGTH * to_nchars,
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6291 dst);
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6292 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6293 {
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6294 coding_set_source (coding);
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6295 dst_end = ((unsigned char *) coding->source) + coding->consumed;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6296 }
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6297 else
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6298 dst_end = coding->destination + coding->dst_bytes;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6299 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6300
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6301 for (i = 0; i < to_nchars; i++)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6302 {
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6303 if (i > 0)
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6304 c = XINT (AREF (trans, i));
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6305 if (coding->dst_multibyte
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6306 || ! CHAR_BYTE8_P (c))
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6307 CHAR_STRING_ADVANCE_NO_UNIFY (c, dst);
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6308 else
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6309 *dst++ = CHAR_TO_BYTE8 (c);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6310 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6311 produced_chars += to_nchars;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6312 *buf++ = to_nchars;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6313 while (--from_nchars > 0)
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6314 *buf++ = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6315 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6316 else
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6317 /* This is an annotation datum. (-C) is the length. */
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6318 buf += -c;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6319 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6320 carryover = buf_end - buf;
30833
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
6321 }
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
6322 else
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
6323 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6324 /* Source characters are at coding->source. */
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
6325 const unsigned char *src = coding->source;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6326 const unsigned char *src_end = src + coding->consumed;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6327
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6328 if (EQ (coding->dst_object, coding->src_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6329 dst_end = (unsigned char *) src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6330 if (coding->src_multibyte != coding->dst_multibyte)
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6331 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6332 if (coding->src_multibyte)
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6333 {
88443
6b86cf30a0b9 (produce_chars): Set the variable `multibytep' correctly.
Kenichi Handa <handa@m17n.org>
parents: 88438
diff changeset
6334 int multibytep = 1;
100135
0e17542db552 (detect_coding_system): Initialize utf_16_le_eol to -1, val to
Kenichi Handa <handa@m17n.org>
parents: 100133
diff changeset
6335 EMACS_INT consumed_chars = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6336
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6337 while (1)
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6338 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
6339 const unsigned char *src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6340 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6341
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6342 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6343 if (dst == dst_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6344 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6345 if (EQ (coding->src_object, coding->dst_object))
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6346 dst_end = (unsigned char *) src;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6347 if (dst == dst_end)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6348 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6349 EMACS_INT offset = src - coding->source;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6350
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6351 dst = alloc_destination (coding, src_end - src + 1,
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6352 dst);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6353 dst_end = coding->destination + coding->dst_bytes;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6354 coding_set_source (coding);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6355 src = coding->source + offset;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6356 src_end = coding->source + coding->src_bytes;
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6357 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6358 dst_end = (unsigned char *) src;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6359 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6360 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6361 *dst++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6362 produced_chars++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6363 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6364 no_more_source:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6365 ;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6366 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6367 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6368 while (src < src_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6369 {
88443
6b86cf30a0b9 (produce_chars): Set the variable `multibytep' correctly.
Kenichi Handa <handa@m17n.org>
parents: 88438
diff changeset
6370 int multibytep = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6371 int c = *src++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6372
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6373 if (dst >= dst_end - 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6374 {
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6375 if (EQ (coding->src_object, coding->dst_object))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
6376 dst_end = (unsigned char *) src;
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6377 if (dst >= dst_end - 1)
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6378 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6379 EMACS_INT offset = src - coding->source;
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6380 EMACS_INT more_bytes;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6381
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6382 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6383 more_bytes = ((src_end - src) / 2) + 2;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6384 else
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6385 more_bytes = src_end - src + 2;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6386 dst = alloc_destination (coding, more_bytes, dst);
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6387 dst_end = coding->destination + coding->dst_bytes;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6388 coding_set_source (coding);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6389 src = coding->source + offset;
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6390 src_end = coding->source + coding->src_bytes;
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6391 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6392 dst_end = (unsigned char *) src;
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6393 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6394 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6395 EMIT_ONE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6396 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6397 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6398 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6399 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6400 if (!EQ (coding->src_object, coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6401 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6402 EMACS_INT require = coding->src_bytes - coding->dst_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6403
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6404 if (require > 0)
23325
bbd06336cd0c (check_composing_code): If the current composing
Kenichi Handa <handa@m17n.org>
parents: 23315
diff changeset
6405 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6406 EMACS_INT offset = src - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6407
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6408 dst = alloc_destination (coding, require, dst);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6409 coding_set_source (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6410 src = coding->source + offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6411 src_end = coding->source + coding->src_bytes;
23325
bbd06336cd0c (check_composing_code): If the current composing
Kenichi Handa <handa@m17n.org>
parents: 23315
diff changeset
6412 }
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6413 }
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6414 produced_chars = coding->consumed_char;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6415 while (src < src_end)
92406
c36bda0a03cc (decode_coding_big5, produce_chars): Fix typos in last
Andreas Schwab <schwab@suse.de>
parents: 92399
diff changeset
6416 *dst++ = *src++;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6417 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6418 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6419
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6420 produced = dst - (coding->destination + coding->produced);
90809
3c52757d5f6e (produce_chars): Don't call insert_from_gap if no
Kenichi Handa <handa@m17n.org>
parents: 90772
diff changeset
6421 if (BUFFERP (coding->dst_object) && produced_chars > 0)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6422 insert_from_gap (produced_chars, produced);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6423 coding->produced += produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6424 coding->produced_char += produced_chars;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6425 return carryover;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6426 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6427
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6428 /* Compose text in CODING->object according to the annotation data at
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6429 CHARBUF. CHARBUF is an array:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6430 [ -LENGTH ANNOTATION_MASK NCHARS METHOD [ COMPONENTS... ] ]
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6431 */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6432
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6433 static INLINE void
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6434 produce_composition (coding, charbuf, pos)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6435 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6436 int *charbuf;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6437 EMACS_INT pos;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6438 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6439 int len;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6440 EMACS_INT to;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6441 enum composition_method method;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6442 Lisp_Object components;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6443
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6444 len = -charbuf[0];
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6445 to = pos + charbuf[2];
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
6446 if (to <= pos)
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
6447 return;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6448 method = (enum composition_method) (charbuf[3]);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6449
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6450 if (method == COMPOSITION_RELATIVE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6451 components = Qnil;
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
6452 else if (method >= COMPOSITION_WITH_RULE
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
6453 && method <= COMPOSITION_WITH_RULE_ALTCHARS)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6454 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6455 Lisp_Object args[MAX_COMPOSITION_COMPONENTS * 2 - 1];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6456 int i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6457
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6458 len -= 4;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6459 charbuf += 4;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6460 for (i = 0; i < len; i++)
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
6461 {
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
6462 args[i] = make_number (charbuf[i]);
90359
041f75914d0c (produce_composition): Compare charbuf[i] instead of
Kenichi Handa <handa@m17n.org>
parents: 90354
diff changeset
6463 if (charbuf[i] < 0)
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
6464 return;
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
6465 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6466 components = (method == COMPOSITION_WITH_ALTCHARS
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6467 ? Fstring (len, args) : Fvector (len, args));
30833
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
6468 }
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
6469 else
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
6470 return;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6471 compose_text (pos, to, components, Qnil, coding->dst_object);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6472 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6473
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6474
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6475 /* Put `charset' property on text in CODING->dst_object according to
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6476 the annotation data at CHARBUF. CHARBUF is an array:
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6477 [ -LENGTH ANNOTATION_MASK NCHARS CHARSET-ID ]
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6478 */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6479
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6480 static INLINE void
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6481 produce_charset (coding, charbuf, pos)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6482 struct coding_system *coding;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6483 int *charbuf;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6484 EMACS_INT pos;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6485 {
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6486 EMACS_INT from = pos - charbuf[2];
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6487 struct charset *charset = CHARSET_FROM_ID (charbuf[3]);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6488
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6489 Fput_text_property (make_number (from), make_number (pos),
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6490 Qcharset, CHARSET_NAME (charset),
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6491 coding->dst_object);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6492 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6493
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6494
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6495 #define CHARBUF_SIZE 0x4000
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6496
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6497 #define ALLOC_CONVERSION_WORK_AREA(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6498 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6499 int size = CHARBUF_SIZE;; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6500 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6501 coding->charbuf = NULL; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6502 while (size > 1024) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6503 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6504 coding->charbuf = (int *) alloca (sizeof (int) * size); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6505 if (coding->charbuf) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6506 break; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6507 size >>= 1; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6508 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6509 if (! coding->charbuf) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6510 { \
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
6511 record_conversion_result (coding, CODING_RESULT_INSUFFICIENT_MEM); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6512 return coding->result; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6513 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6514 coding->charbuf_size = size; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6515 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6516
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6517
30833
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
6518 static void
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6519 produce_annotation (coding, pos)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6520 struct coding_system *coding;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6521 EMACS_INT pos;
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6522 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6523 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6524 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6525
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6526 if (NILP (coding->dst_object))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6527 return;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6528
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6529 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6530 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6531 if (*charbuf >= 0)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6532 pos += *charbuf++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6533 else
29877
7b43e1fb478a (decode_eol_post_ccl): Special handling for undecided
Eli Zaretskii <eliz@gnu.org>
parents: 29725
diff changeset
6534 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6535 int len = -*charbuf;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6536 switch (charbuf[1])
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6537 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6538 case CODING_ANNOTATE_COMPOSITION_MASK:
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6539 produce_composition (coding, charbuf, pos);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6540 break;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6541 case CODING_ANNOTATE_CHARSET_MASK:
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6542 produce_charset (coding, charbuf, pos);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6543 break;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6544 default:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6545 abort ();
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6546 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6547 charbuf += len;
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6548 }
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6549 }
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6550 }
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6551
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6552 /* Decode the data at CODING->src_object into CODING->dst_object.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6553 CODING->src_object is a buffer, a string, or nil.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6554 CODING->dst_object is a buffer.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6555
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6556 If CODING->src_object is a buffer, it must be the current buffer.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6557 In this case, if CODING->src_pos is positive, it is a position of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6558 the source text in the buffer, otherwise, the source text is in the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6559 gap area of the buffer, and CODING->src_pos specifies the offset of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6560 the text from GPT (which must be the same as PT). If this is the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6561 same buffer as CODING->dst_object, CODING->src_pos must be
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6562 negative.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6563
90380
4bf7966e0788 (decode_coding): Typo in comment fixed.
Kenichi Handa <handa@m17n.org>
parents: 90378
diff changeset
6564 If CODING->src_object is a string, CODING->src_pos is an index to
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6565 that string.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6566
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6567 If CODING->src_object is nil, CODING->source must already point to
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6568 the non-relocatable memory area. In this case, CODING->src_pos is
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6569 an offset from CODING->source.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6570
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6571 The decoded data is inserted at the current point of the buffer
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6572 CODING->dst_object.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6573 */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6574
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6575 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6576 decode_coding (coding)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6577 struct coding_system *coding;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6578 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6579 Lisp_Object attrs;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6580 Lisp_Object undo_list;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6581 Lisp_Object translation_table;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6582 int carryover;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6583 int i;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6584
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6585 if (BUFFERP (coding->src_object)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6586 && coding->src_pos > 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6587 && coding->src_pos < GPT
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6588 && coding->src_pos + coding->src_chars > GPT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6589 move_gap_both (coding->src_pos, coding->src_pos_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6590
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6591 undo_list = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6592 if (BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6593 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6594 if (current_buffer != XBUFFER (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6595 set_buffer_internal (XBUFFER (coding->dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6596 if (GPT != PT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6597 move_gap_both (PT, PT_BYTE);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6598 undo_list = current_buffer->undo_list;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6599 current_buffer->undo_list = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6600 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6601
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6602 coding->consumed = coding->consumed_char = 0;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
6603 coding->produced = coding->produced_char = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6604 coding->chars_at_source = 0;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
6605 record_conversion_result (coding, CODING_RESULT_SUCCESS);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
6606 coding->errors = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6607
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6608 ALLOC_CONVERSION_WORK_AREA (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6609
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6610 attrs = CODING_ID_ATTRS (coding->id);
89861
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6611 translation_table = get_translation_table (attrs, 0, NULL);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6612
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6613 carryover = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6614 do
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6615 {
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6616 EMACS_INT pos = coding->dst_pos + coding->produced_char;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6617
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6618 coding_set_source (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6619 coding->annotated = 0;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6620 coding->charbuf_used = carryover;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6621 (*(coding->decoder)) (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6622 coding_set_destination (coding);
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6623 carryover = produce_chars (coding, translation_table, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6624 if (coding->annotated)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6625 produce_annotation (coding, pos);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6626 for (i = 0; i < carryover; i++)
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6627 coding->charbuf[i]
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6628 = coding->charbuf[coding->charbuf_used - carryover + i];
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6629 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6630 while (coding->consumed < coding->src_bytes
90336
f0338dbf2276 (decode_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 90327
diff changeset
6631 && (coding->result == CODING_RESULT_SUCCESS
f0338dbf2276 (decode_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 90327
diff changeset
6632 || coding->result == CODING_RESULT_INVALID_SRC));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6633
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6634 if (carryover > 0)
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6635 {
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6636 coding_set_destination (coding);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6637 coding->charbuf_used = carryover;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6638 produce_chars (coding, translation_table, 1);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6639 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6640
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6641 coding->carryover_bytes = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6642 if (coding->consumed < coding->src_bytes)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6643 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6644 int nbytes = coding->src_bytes - coding->consumed;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
6645 const unsigned char *src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6646
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6647 coding_set_source (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6648 coding_set_destination (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6649 src = coding->source + coding->consumed;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6650
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6651 if (coding->mode & CODING_MODE_LAST_BLOCK)
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6652 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6653 /* Flush out unprocessed data as binary chars. We are sure
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6654 that the amount of data is less than the size of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6655 coding->charbuf. */
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
6656 coding->charbuf_used = 0;
100587
d91e3320dd81 (decode_coding): Clear chars_at_source flag when using charbuf.
Jason Rumney <jasonr@gnu.org>
parents: 100303
diff changeset
6657 coding->chars_at_source = 0;
d91e3320dd81 (decode_coding): Clear chars_at_source flag when using charbuf.
Jason Rumney <jasonr@gnu.org>
parents: 100303
diff changeset
6658
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6659 while (nbytes-- > 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6660 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6661 int c = *src++;
89279
1fd77c471ee6 (decode_coding_utf_8): When eol_type is Qdos, handle
Kenichi Handa <handa@m17n.org>
parents: 89227
diff changeset
6662
90243
c59afb15f5c6 (decode_coding): Fix handling of invalid bytes.
Kenichi Handa <handa@m17n.org>
parents: 90231
diff changeset
6663 if (c & 0x80)
c59afb15f5c6 (decode_coding): Fix handling of invalid bytes.
Kenichi Handa <handa@m17n.org>
parents: 90231
diff changeset
6664 c = BYTE8_TO_CHAR (c);
c59afb15f5c6 (decode_coding): Fix handling of invalid bytes.
Kenichi Handa <handa@m17n.org>
parents: 90231
diff changeset
6665 coding->charbuf[coding->charbuf_used++] = c;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6666 }
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
6667 produce_chars (coding, Qnil, 1);
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6668 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6669 else
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6670 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6671 /* Record unprocessed bytes in coding->carryover. We are
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6672 sure that the amount of data is less than the size of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6673 coding->carryover. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6674 unsigned char *p = coding->carryover;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6675
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6676 coding->carryover_bytes = nbytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6677 while (nbytes-- > 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6678 *p++ = *src++;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6679 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6680 coding->consumed = coding->src_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6681 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6682
90378
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6683 if (! EQ (CODING_ID_EOL_TYPE (coding->id), Qunix))
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6684 decode_eol (coding);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6685 if (BUFFERP (coding->dst_object))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6686 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6687 current_buffer->undo_list = undo_list;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6688 record_insert (coding->dst_pos, coding->produced_char);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6689 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
6690 return coding->result;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6691 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6692
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6693
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
6694 /* Extract an annotation datum from a composition starting at POS and
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6695 ending before LIMIT of CODING->src_object (buffer or string), store
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6696 the data in BUF, set *STOP to a starting position of the next
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6697 composition (if any) or to LIMIT, and return the address of the
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6698 next element of BUF.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6699
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6700 If such an annotation is not found, set *STOP to a starting
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6701 position of a composition after POS (if any) or to LIMIT, and
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6702 return BUF. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6703
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6704 static INLINE int *
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6705 handle_composition_annotation (pos, limit, coding, buf, stop)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6706 EMACS_INT pos, limit;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6707 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6708 int *buf;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6709 EMACS_INT *stop;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6710 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6711 EMACS_INT start, end;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6712 Lisp_Object prop;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6713
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6714 if (! find_composition (pos, limit, &start, &end, &prop, coding->src_object)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6715 || end > limit)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6716 *stop = limit;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6717 else if (start > pos)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6718 *stop = start;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6719 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6720 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6721 if (start == pos)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6722 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6723 /* We found a composition. Store the corresponding
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6724 annotation data in BUF. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6725 int *head = buf;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6726 enum composition_method method = COMPOSITION_METHOD (prop);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6727 int nchars = COMPOSITION_LENGTH (prop);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6728
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6729 ADD_COMPOSITION_DATA (buf, nchars, method);
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6730 if (method != COMPOSITION_RELATIVE)
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6731 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6732 Lisp_Object components;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6733 int len, i, i_byte;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6734
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6735 components = COMPOSITION_COMPONENTS (prop);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6736 if (VECTORP (components))
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6737 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6738 len = XVECTOR (components)->size;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6739 for (i = 0; i < len; i++)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6740 *buf++ = XINT (AREF (components, i));
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6741 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6742 else if (STRINGP (components))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6743 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
6744 len = SCHARS (components);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6745 i = i_byte = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6746 while (i < len)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6747 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6748 FETCH_STRING_CHAR_ADVANCE (*buf, components, i, i_byte);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6749 buf++;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6750 }
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6751 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6752 else if (INTEGERP (components))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6753 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6754 len = 1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6755 *buf++ = XINT (components);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6756 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6757 else if (CONSP (components))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6758 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6759 for (len = 0; CONSP (components);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6760 len++, components = XCDR (components))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6761 *buf++ = XINT (XCAR (components));
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6762 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6763 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6764 abort ();
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6765 *head -= len;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6766 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6767 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6768
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6769 if (find_composition (end, limit, &start, &end, &prop,
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6770 coding->src_object)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6771 && end <= limit)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6772 *stop = start;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6773 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6774 *stop = limit;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6775 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6776 return buf;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6777 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6778
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6779
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
6780 /* Extract an annotation datum from a text property `charset' at POS of
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6781 CODING->src_object (buffer or string), store the data in BUF, set
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6782 *STOP to the position where the value of `charset' property changes
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6783 (limited by LIMIT), and return the address of the next element of
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6784 BUF.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6785
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6786 If the property value is nil, set *STOP to the position where the
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6787 property value is non-nil (limited by LIMIT), and return BUF. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6788
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6789 static INLINE int *
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6790 handle_charset_annotation (pos, limit, coding, buf, stop)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6791 EMACS_INT pos, limit;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6792 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6793 int *buf;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6794 EMACS_INT *stop;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6795 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6796 Lisp_Object val, next;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6797 int id;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6798
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6799 val = Fget_text_property (make_number (pos), Qcharset, coding->src_object);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6800 if (! NILP (val) && CHARSETP (val))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6801 id = XINT (CHARSET_SYMBOL_ID (val));
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6802 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6803 id = -1;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6804 ADD_CHARSET_DATA (buf, 0, id);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6805 next = Fnext_single_property_change (make_number (pos), Qcharset,
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6806 coding->src_object,
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6807 make_number (limit));
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6808 *stop = XINT (next);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6809 return buf;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6810 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6811
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6812
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6813 static void
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6814 consume_chars (coding, translation_table, max_lookup)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6815 struct coding_system *coding;
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6816 Lisp_Object translation_table;
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6817 int max_lookup;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6818 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6819 int *buf = coding->charbuf;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6820 int *buf_end = coding->charbuf + coding->charbuf_size;
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
6821 const unsigned char *src = coding->source + coding->consumed;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
6822 const unsigned char *src_end = coding->source + coding->src_bytes;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6823 EMACS_INT pos = coding->src_pos + coding->consumed_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6824 EMACS_INT end_pos = coding->src_pos + coding->src_chars;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6825 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6826 Lisp_Object eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6827 int c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6828 EMACS_INT stop, stop_composition, stop_charset;
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6829 int *lookup_buf = NULL;
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6830
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6831 if (! NILP (translation_table))
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6832 lookup_buf = alloca (sizeof (int) * max_lookup);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6833
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6834 eol_type = CODING_ID_EOL_TYPE (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6835 if (VECTORP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6836 eol_type = Qunix;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6837
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6838 /* Note: composition handling is not yet implemented. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6839 coding->common_flags &= ~CODING_ANNOTATE_COMPOSITION_MASK;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6840
89562
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
6841 if (NILP (coding->src_object))
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
6842 stop = stop_composition = stop_charset = end_pos;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6843 else
89562
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
6844 {
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
6845 if (coding->common_flags & CODING_ANNOTATE_COMPOSITION_MASK)
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
6846 stop = stop_composition = pos;
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
6847 else
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
6848 stop = stop_composition = end_pos;
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
6849 if (coding->common_flags & CODING_ANNOTATE_CHARSET_MASK)
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
6850 stop = stop_charset = pos;
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
6851 else
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
6852 stop_charset = end_pos;
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
6853 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6854
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6855 /* Compensate for CRLF and conversion. */
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6856 buf_end -= 1 + MAX_ANNOTATION_LENGTH;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6857 while (buf < buf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6858 {
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6859 Lisp_Object trans;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6860
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6861 if (pos == stop)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6862 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6863 if (pos == end_pos)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6864 break;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6865 if (pos == stop_composition)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6866 buf = handle_composition_annotation (pos, end_pos, coding,
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6867 buf, &stop_composition);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6868 if (pos == stop_charset)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6869 buf = handle_charset_annotation (pos, end_pos, coding,
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6870 buf, &stop_charset);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6871 stop = (stop_composition < stop_charset
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6872 ? stop_composition : stop_charset);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6873 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6874
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6875 if (! multibytep)
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
6876 {
89462
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
6877 EMACS_INT bytes;
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
6878
89933
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
6879 if (coding->encoder == encode_coding_raw_text)
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
6880 c = *src++, pos++;
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
6881 else if ((bytes = MULTIBYTE_LENGTH (src, src_end)) > 0)
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6882 c = STRING_CHAR_ADVANCE_NO_UNIFY (src), pos += bytes;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
6883 else
89917
1763eef5ad02 (encode_coding_utf_8): Fix handling of raw-byte char.
Kenichi Handa <handa@m17n.org>
parents: 89905
diff changeset
6884 c = BYTE8_TO_CHAR (*src), src++, pos++;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
6885 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6886 else
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6887 c = STRING_CHAR_ADVANCE_NO_UNIFY (src), pos++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6888 if ((c == '\r') && (coding->mode & CODING_MODE_SELECTIVE_DISPLAY))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6889 c = '\n';
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6890 if (! EQ (eol_type, Qunix))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6891 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6892 if (c == '\n')
32443
57fa108c491f (code_convert_region): Be sure to initialize coding->category_idx.
Kenichi Handa <handa@m17n.org>
parents: 31458
diff changeset
6893 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6894 if (EQ (eol_type, Qdos))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6895 *buf++ = '\r';
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6896 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6897 c = '\r';
32443
57fa108c491f (code_convert_region): Be sure to initialize coding->category_idx.
Kenichi Handa <handa@m17n.org>
parents: 31458
diff changeset
6898 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6899 }
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6900
89858
23cb9ed79225 (get_translation_table): Declare it as Lisp_Object.
Kenichi Handa <handa@m17n.org>
parents: 89856
diff changeset
6901 trans = Qnil;
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6902 LOOKUP_TRANSLATION_TABLE (translation_table, c, trans);
89858
23cb9ed79225 (get_translation_table): Declare it as Lisp_Object.
Kenichi Handa <handa@m17n.org>
parents: 89856
diff changeset
6903 if (NILP (trans))
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6904 *buf++ = c;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6905 else
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6906 {
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6907 int from_nchars = 1, to_nchars = 1;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6908 int *lookup_buf_end;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6909 const unsigned char *p = src;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6910 int i;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6911
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6912 lookup_buf[0] = c;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6913 for (i = 1; i < max_lookup && p < src_end; i++)
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6914 lookup_buf[i] = STRING_CHAR_ADVANCE (p);
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6915 lookup_buf_end = lookup_buf + i;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6916 trans = get_translation (trans, lookup_buf, lookup_buf_end, 1,
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6917 &from_nchars, &to_nchars);
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6918 if (EQ (trans, Qt)
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6919 || buf + to_nchars > buf_end)
23881
20d595402dea (DECODE_DESIGNATION): Jump to label_invalid_code if
Kenichi Handa <handa@m17n.org>
parents: 23564
diff changeset
6920 break;
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6921 *buf++ = *lookup_buf;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6922 for (i = 1; i < to_nchars; i++)
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6923 *buf++ = XINT (AREF (trans, i));
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6924 for (i = 1; i < from_nchars; i++, pos++)
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6925 src += MULTIBYTE_LENGTH_NO_CHECK (src);
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6926 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6927 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6928
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6929 coding->consumed = src - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6930 coding->consumed_char = pos - coding->src_pos;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6931 coding->charbuf_used = buf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6932 coding->chars_at_source = 0;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6933 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6934
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6935
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6936 /* Encode the text at CODING->src_object into CODING->dst_object.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6937 CODING->src_object is a buffer or a string.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6938 CODING->dst_object is a buffer or nil.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6939
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6940 If CODING->src_object is a buffer, it must be the current buffer.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6941 In this case, if CODING->src_pos is positive, it is a position of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6942 the source text in the buffer; otherwise, the source text is in the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6943 gap area of the buffer, and CODING->src_pos specifies the offset of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6944 the text from GPT (which must be the same as PT). If this is the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6945 same buffer as CODING->dst_object, CODING->src_pos must be
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6946 negative and CODING should not have `pre-write-conversion'.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6947
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6948 If CODING->src_object is a string, CODING should not have
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6949 `pre-write-conversion'.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6950
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6951 If CODING->dst_object is a buffer, the encoded data is inserted at
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6952 the current point of that buffer.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6953
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6954 If CODING->dst_object is nil, the encoded data is placed at the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6955 memory area specified by CODING->destination. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6956
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6957 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6958 encode_coding (coding)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6959 struct coding_system *coding;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6960 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6961 Lisp_Object attrs;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6962 Lisp_Object translation_table;
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6963 int max_lookup;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6964
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6965 attrs = CODING_ID_ATTRS (coding->id);
89933
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
6966 if (coding->encoder == encode_coding_raw_text)
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
6967 translation_table = Qnil, max_lookup = 0;
42661
e85e4d9494b1 (code_convert_region): Don't copy old text if undo disabled.
Richard M. Stallman <rms@gnu.org>
parents: 42105
diff changeset
6968 else
89933
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
6969 translation_table = get_translation_table (attrs, 1, &max_lookup);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6970
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6971 if (BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6972 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6973 set_buffer_internal (XBUFFER (coding->dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6974 coding->dst_multibyte
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6975 = ! NILP (current_buffer->enable_multibyte_characters);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6976 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6977
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6978 coding->consumed = coding->consumed_char = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6979 coding->produced = coding->produced_char = 0;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
6980 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6981 coding->errors = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6982
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6983 ALLOC_CONVERSION_WORK_AREA (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6984
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6985 do {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6986 coding_set_source (coding);
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6987 consume_chars (coding, translation_table, max_lookup);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6988 coding_set_destination (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6989 (*(coding->encoder)) (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6990 } while (coding->consumed_char < coding->src_chars);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6991
90809
3c52757d5f6e (produce_chars): Don't call insert_from_gap if no
Kenichi Handa <handa@m17n.org>
parents: 90772
diff changeset
6992 if (BUFFERP (coding->dst_object) && coding->produced_char > 0)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6993 insert_from_gap (coding->produced_char, coding->produced);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6994
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6995 return (coding->result);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6996 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6997
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
6998
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6999 /* Name (or base name) of work buffer for code conversion. */
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7000 static Lisp_Object Vcode_conversion_workbuf_name;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7001
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7002 /* A working buffer used by the top level conversion. Once it is
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7003 created, it is never destroyed. It has the name
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7004 Vcode_conversion_workbuf_name. The other working buffers are
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7005 destroyed after the use is finished, and their names are modified
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7006 versions of Vcode_conversion_workbuf_name. */
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7007 static Lisp_Object Vcode_conversion_reused_workbuf;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7008
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7009 /* Nonzero iff Vcode_conversion_reused_workbuf is already in use. */
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7010 static int reused_workbuf_in_use;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7011
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7012
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7013 /* Return a working buffer for code conversion. MULTIBYTE specifies the
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7014 multibyteness of the returned buffer. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7015
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
7016 static Lisp_Object
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7017 make_conversion_work_buffer (multibyte)
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
7018 int multibyte;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7019 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7020 Lisp_Object name, workbuf;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7021 struct buffer *current;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7022
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7023 if (reused_workbuf_in_use++)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7024 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7025 name = Fgenerate_new_buffer_name (Vcode_conversion_workbuf_name, Qnil);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7026 workbuf = Fget_buffer_create (name);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7027 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7028 else
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7029 {
99074
10cd979d05ca (make_conversion_work_buffer): Check that Vcode_conversion_reused_workbuf
Noah Friedman <friedman@splode.com>
parents: 98992
diff changeset
7030 if (NILP (Fbuffer_live_p (Vcode_conversion_reused_workbuf)))
98186
1cfa973fde14 (make_conversion_work_buffer): Avoid calling
Kenichi Handa <handa@m17n.org>
parents: 96571
diff changeset
7031 Vcode_conversion_reused_workbuf
1cfa973fde14 (make_conversion_work_buffer): Avoid calling
Kenichi Handa <handa@m17n.org>
parents: 96571
diff changeset
7032 = Fget_buffer_create (Vcode_conversion_workbuf_name);
1cfa973fde14 (make_conversion_work_buffer): Avoid calling
Kenichi Handa <handa@m17n.org>
parents: 96571
diff changeset
7033 workbuf = Vcode_conversion_reused_workbuf;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7034 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7035 current = current_buffer;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7036 set_buffer_internal (XBUFFER (workbuf));
100262
46114a72fb0e (make_conversion_work_buffer): Disable buffer modification hooks in
Chong Yidong <cyd@stupidchicken.com>
parents: 100176
diff changeset
7037 /* We can't allow modification hooks to run in the work buffer. For
46114a72fb0e (make_conversion_work_buffer): Disable buffer modification hooks in
Chong Yidong <cyd@stupidchicken.com>
parents: 100176
diff changeset
7038 instance, directory_files_internal assumes that file decoding
46114a72fb0e (make_conversion_work_buffer): Disable buffer modification hooks in
Chong Yidong <cyd@stupidchicken.com>
parents: 100176
diff changeset
7039 doesn't compile new regexps. */
46114a72fb0e (make_conversion_work_buffer): Disable buffer modification hooks in
Chong Yidong <cyd@stupidchicken.com>
parents: 100176
diff changeset
7040 Fset (Fmake_local_variable (Qinhibit_modification_hooks), Qt);
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
7041 Ferase_buffer ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7042 current_buffer->undo_list = Qt;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7043 current_buffer->enable_multibyte_characters = multibyte ? Qt : Qnil;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7044 set_buffer_internal (current);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7045 return workbuf;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7046 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7047
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7048
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7049 static Lisp_Object
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7050 code_conversion_restore (arg)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7051 Lisp_Object arg;
26067
f54ca66e2571 (code_convert_string): Add record_unwind_protect to
Kenichi Handa <handa@m17n.org>
parents: 25860
diff changeset
7052 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7053 Lisp_Object current, workbuf;
90263
80fb4c061e99 (code_conversion_restore): GCPRO arg.
Kenichi Handa <handa@m17n.org>
parents: 90261
diff changeset
7054 struct gcpro gcpro1;
80fb4c061e99 (code_conversion_restore): GCPRO arg.
Kenichi Handa <handa@m17n.org>
parents: 90261
diff changeset
7055
80fb4c061e99 (code_conversion_restore): GCPRO arg.
Kenichi Handa <handa@m17n.org>
parents: 90261
diff changeset
7056 GCPRO1 (arg);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7057 current = XCAR (arg);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7058 workbuf = XCDR (arg);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7059 if (! NILP (workbuf))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7060 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7061 if (EQ (workbuf, Vcode_conversion_reused_workbuf))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7062 reused_workbuf_in_use = 0;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7063 else if (! NILP (Fbuffer_live_p (workbuf)))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7064 Fkill_buffer (workbuf);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7065 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7066 set_buffer_internal (XBUFFER (current));
90263
80fb4c061e99 (code_conversion_restore): GCPRO arg.
Kenichi Handa <handa@m17n.org>
parents: 90261
diff changeset
7067 UNGCPRO;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7068 return Qnil;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7069 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7070
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7071 Lisp_Object
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7072 code_conversion_save (with_work_buf, multibyte)
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7073 int with_work_buf, multibyte;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7074 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7075 Lisp_Object workbuf = Qnil;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7076
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7077 if (with_work_buf)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7078 workbuf = make_conversion_work_buffer (multibyte);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7079 record_unwind_protect (code_conversion_restore,
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7080 Fcons (Fcurrent_buffer (), workbuf));
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7081 return workbuf;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7082 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7083
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7084 int
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7085 decode_coding_gap (coding, chars, bytes)
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
7086 struct coding_system *coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7087 EMACS_INT chars, bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7088 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7089 int count = specpdl_ptr - specpdl;
89448
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7090 Lisp_Object attrs;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7091
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7092 code_conversion_save (0, 0);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7093
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7094 coding->src_object = Fcurrent_buffer ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7095 coding->src_chars = chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7096 coding->src_bytes = bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7097 coding->src_pos = -chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7098 coding->src_pos_byte = -bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7099 coding->src_multibyte = chars < bytes;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7100 coding->dst_object = coding->src_object;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7101 coding->dst_pos = PT;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7102 coding->dst_pos_byte = PT_BYTE;
88443
6b86cf30a0b9 (produce_chars): Set the variable `multibytep' correctly.
Kenichi Handa <handa@m17n.org>
parents: 88438
diff changeset
7103 coding->dst_multibyte = ! NILP (current_buffer->enable_multibyte_characters);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7104
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7105 if (CODING_REQUIRE_DETECTION (coding))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7106 detect_coding (coding);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
7107
90350
60eaefb08cf7 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90346
diff changeset
7108 coding->mode |= CODING_MODE_LAST_BLOCK;
90772
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
7109 current_buffer->text->inhibit_shrinking = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7110 decode_coding (coding);
90772
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
7111 current_buffer->text->inhibit_shrinking = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7112
89448
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7113 attrs = CODING_ID_ATTRS (coding->id);
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7114 if (! NILP (CODING_ATTR_POST_READ (attrs)))
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7115 {
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7116 EMACS_INT prev_Z = Z, prev_Z_BYTE = Z_BYTE;
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7117 Lisp_Object val;
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7118
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7119 TEMP_SET_PT_BOTH (coding->dst_pos, coding->dst_pos_byte);
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7120 val = call1 (CODING_ATTR_POST_READ (attrs),
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7121 make_number (coding->produced_char));
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7122 CHECK_NATNUM (val);
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7123 coding->produced_char += Z - prev_Z;
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7124 coding->produced += Z_BYTE - prev_Z_BYTE;
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7125 }
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7126
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7127 unbind_to (count, Qnil);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
7128 return coding->result;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7129 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7130
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7131 int
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7132 encode_coding_gap (coding, chars, bytes)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7133 struct coding_system *coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7134 EMACS_INT chars, bytes;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7135 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7136 int count = specpdl_ptr - specpdl;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7137
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7138 code_conversion_save (0, 0);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7139
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7140 coding->src_object = Fcurrent_buffer ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7141 coding->src_chars = chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7142 coding->src_bytes = bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7143 coding->src_pos = -chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7144 coding->src_pos_byte = -bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7145 coding->src_multibyte = chars < bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7146 coding->dst_object = coding->src_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7147 coding->dst_pos = PT;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7148 coding->dst_pos_byte = PT_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7149
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7150 encode_coding (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7151
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7152 unbind_to (count, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7153 return coding->result;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7154 }
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7155
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7156
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7157 /* Decode the text in the range FROM/FROM_BYTE and TO/TO_BYTE in
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7158 SRC_OBJECT into DST_OBJECT by coding context CODING.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7159
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7160 SRC_OBJECT is a buffer, a string, or Qnil.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7161
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7162 If it is a buffer, the text is at point of the buffer. FROM and TO
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7163 are positions in the buffer.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7164
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7165 If it is a string, the text is at the beginning of the string.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7166 FROM and TO are indices to the string.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7167
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7168 If it is nil, the text is at coding->source. FROM and TO are
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7169 indices to coding->source.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7170
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7171 DST_OBJECT is a buffer, Qt, or Qnil.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7172
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7173 If it is a buffer, the decoded text is inserted at point of the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7174 buffer. If the buffer is the same as SRC_OBJECT, the source text
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7175 is deleted.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7176
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7177 If it is Qt, a string is made from the decoded text, and
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7178 set in CODING->dst_object.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7179
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7180 If it is Qnil, the decoded text is stored at CODING->destination.
89418
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
7181 The caller must allocate CODING->dst_bytes bytes at
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7182 CODING->destination by xmalloc. If the decoded text is longer than
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7183 CODING->dst_bytes, CODING->destination is relocated by xrealloc.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7184 */
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7185
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7186 void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7187 decode_coding_object (coding, src_object, from, from_byte, to, to_byte,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7188 dst_object)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7189 struct coding_system *coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7190 Lisp_Object src_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7191 EMACS_INT from, from_byte, to, to_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7192 Lisp_Object dst_object;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7193 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7194 int count = specpdl_ptr - specpdl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7195 unsigned char *destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7196 EMACS_INT dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7197 EMACS_INT chars = to - from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7198 EMACS_INT bytes = to_byte - from_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7199 Lisp_Object attrs;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7200 int saved_pt = -1, saved_pt_byte;
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7201 int need_marker_adjustment = 0;
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7202 Lisp_Object old_deactivate_mark;
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7203
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7204 old_deactivate_mark = Vdeactivate_mark;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7205
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7206 if (NILP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7207 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7208 destination = coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7209 dst_bytes = coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7210 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7211
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7212 coding->src_object = src_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7213 coding->src_chars = chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7214 coding->src_bytes = bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7215 coding->src_multibyte = chars < bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7216
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7217 if (STRINGP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7218 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7219 coding->src_pos = from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7220 coding->src_pos_byte = from_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7221 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7222 else if (BUFFERP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7223 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7224 set_buffer_internal (XBUFFER (src_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7225 if (from != GPT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7226 move_gap_both (from, from_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7227 if (EQ (src_object, dst_object))
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7228 {
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7229 struct Lisp_Marker *tail;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7230
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7231 for (tail = BUF_MARKERS (current_buffer); tail; tail = tail->next)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7232 {
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7233 tail->need_adjustment
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7234 = tail->charpos == (tail->insertion_type ? from : to);
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7235 need_marker_adjustment |= tail->need_adjustment;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7236 }
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7237 saved_pt = PT, saved_pt_byte = PT_BYTE;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7238 TEMP_SET_PT_BOTH (from, from_byte);
92458
5f5f07a5c076 (decode_coding_object): Inhibit gap shrinking while
Andreas Schwab <schwab@suse.de>
parents: 92406
diff changeset
7239 current_buffer->text->inhibit_shrinking = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7240 del_range_both (from, from_byte, to, to_byte, 1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7241 coding->src_pos = -chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7242 coding->src_pos_byte = -bytes;
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
7243 }
42661
e85e4d9494b1 (code_convert_region): Don't copy old text if undo disabled.
Richard M. Stallman <rms@gnu.org>
parents: 42105
diff changeset
7244 else
e85e4d9494b1 (code_convert_region): Don't copy old text if undo disabled.
Richard M. Stallman <rms@gnu.org>
parents: 42105
diff changeset
7245 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7246 coding->src_pos = from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7247 coding->src_pos_byte = from_byte;
29985
c17e78d8c720 (code_convert_region): Even if the length of text is
Kenichi Handa <handa@m17n.org>
parents: 29932
diff changeset
7248 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7249 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7250
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7251 if (CODING_REQUIRE_DETECTION (coding))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7252 detect_coding (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7253 attrs = CODING_ID_ATTRS (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7254
89418
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
7255 if (EQ (dst_object, Qt)
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
7256 || (! NILP (CODING_ATTR_POST_READ (attrs))
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
7257 && NILP (dst_object)))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7258 {
93321
c3fe9ef79b56 (decode_coding_object): Fix last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93197
diff changeset
7259 coding->dst_multibyte = !CODING_FOR_UNIBYTE (coding);
c3fe9ef79b56 (decode_coding_object): Fix last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93197
diff changeset
7260 coding->dst_object = code_conversion_save (1, coding->dst_multibyte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7261 coding->dst_pos = BEG;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7262 coding->dst_pos_byte = BEG_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7263 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7264 else if (BUFFERP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7265 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7266 code_conversion_save (0, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7267 coding->dst_object = dst_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7268 coding->dst_pos = BUF_PT (XBUFFER (dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7269 coding->dst_pos_byte = BUF_PT_BYTE (XBUFFER (dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7270 coding->dst_multibyte
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7271 = ! NILP (XBUFFER (dst_object)->enable_multibyte_characters);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7272 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
7273 else
29172
46ad5a027334 (run_pre_post_conversion_on_str): Set point to the
Kenichi Handa <handa@m17n.org>
parents: 29093
diff changeset
7274 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7275 code_conversion_save (0, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7276 coding->dst_object = Qnil;
93322
3b82aab9d8fc (decode_coding_object): Revert part of last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93321
diff changeset
7277 /* Most callers presume this will return a multibyte result, and they
3b82aab9d8fc (decode_coding_object): Revert part of last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93321
diff changeset
7278 won't use `binary' or `raw-text' anyway, so let's not worry about
3b82aab9d8fc (decode_coding_object): Revert part of last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93321
diff changeset
7279 CODING_FOR_UNIBYTE. */
93323
06e93ffa2e9f (decode_coding_object): Fix last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93322
diff changeset
7280 coding->dst_multibyte = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7281 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7282
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7283 decode_coding (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7284
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7285 if (BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7286 set_buffer_internal (XBUFFER (coding->dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7287
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7288 if (! NILP (CODING_ATTR_POST_READ (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7289 {
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7290 struct gcpro gcpro1, gcpro2, gcpro3, gcpro4, gcpro5;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7291 EMACS_INT prev_Z = Z, prev_Z_BYTE = Z_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7292 Lisp_Object val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7293
88506
a7f0d13affa5 (decode_coding_object): Move point to coding->dst_pos before
Kenichi Handa <handa@m17n.org>
parents: 88497
diff changeset
7294 TEMP_SET_PT_BOTH (coding->dst_pos, coding->dst_pos_byte);
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7295 GCPRO5 (coding->src_object, coding->dst_object, src_object, dst_object,
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7296 old_deactivate_mark);
90131
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7297 val = safe_call1 (CODING_ATTR_POST_READ (attrs),
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7298 make_number (coding->produced_char));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7299 UNGCPRO;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7300 CHECK_NATNUM (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7301 coding->produced_char += Z - prev_Z;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7302 coding->produced += Z_BYTE - prev_Z_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7303 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7304
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7305 if (EQ (dst_object, Qt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7306 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7307 coding->dst_object = Fbuffer_string ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7308 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7309 else if (NILP (dst_object) && BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7310 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7311 set_buffer_internal (XBUFFER (coding->dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7312 if (dst_bytes < coding->produced)
42105
09cc243e2d14 (code_convert_region): Update coding->cmp_data->char_offset
Richard M. Stallman <rms@gnu.org>
parents: 42104
diff changeset
7313 {
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7314 destination = xrealloc (destination, coding->produced);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7315 if (! destination)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7316 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7317 record_conversion_result (coding,
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7318 CODING_RESULT_INSUFFICIENT_DST);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7319 unbind_to (count, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7320 return;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7321 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7322 if (BEGV < GPT && GPT < BEGV + coding->produced_char)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7323 move_gap_both (BEGV, BEGV_BYTE);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7324 bcopy (BEGV_ADDR, destination, coding->produced);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7325 coding->destination = destination;
23279
ca159e828a68 (ccl_coding_driver): If ccl_driver is interrupted by a
Kenichi Handa <handa@m17n.org>
parents: 23258
diff changeset
7326 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7327 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7328
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7329 if (saved_pt >= 0)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7330 {
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7331 /* This is the case of:
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7332 (BUFFERP (src_object) && EQ (src_object, dst_object))
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7333 As we have moved PT while replacing the original buffer
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7334 contents, we must recover it now. */
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7335 set_buffer_internal (XBUFFER (src_object));
92458
5f5f07a5c076 (decode_coding_object): Inhibit gap shrinking while
Andreas Schwab <schwab@suse.de>
parents: 92406
diff changeset
7336 current_buffer->text->inhibit_shrinking = 0;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7337 if (saved_pt < from)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7338 TEMP_SET_PT_BOTH (saved_pt, saved_pt_byte);
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7339 else if (saved_pt < from + chars)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7340 TEMP_SET_PT_BOTH (from, from_byte);
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7341 else if (! NILP (current_buffer->enable_multibyte_characters))
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7342 TEMP_SET_PT_BOTH (saved_pt + (coding->produced_char - chars),
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7343 saved_pt_byte + (coding->produced - bytes));
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7344 else
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7345 TEMP_SET_PT_BOTH (saved_pt + (coding->produced - bytes),
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7346 saved_pt_byte + (coding->produced - bytes));
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7347
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7348 if (need_marker_adjustment)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7349 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7350 struct Lisp_Marker *tail;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7351
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7352 for (tail = BUF_MARKERS (current_buffer); tail; tail = tail->next)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7353 if (tail->need_adjustment)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7354 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7355 tail->need_adjustment = 0;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7356 if (tail->insertion_type)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7357 {
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7358 tail->bytepos = from_byte;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7359 tail->charpos = from;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7360 }
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7361 else
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7362 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7363 tail->bytepos = from_byte + coding->produced;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7364 tail->charpos
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7365 = (NILP (current_buffer->enable_multibyte_characters)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7366 ? tail->bytepos : from + coding->produced_char);
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7367 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7368 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7369 }
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7370 }
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7371
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7372 Vdeactivate_mark = old_deactivate_mark;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7373 unbind_to (count, coding->dst_object);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7374 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7375
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7376
29275
b4ea9178e480 (DECODE_COMPOSITION_START): If coding->cmp_data is not
Kenichi Handa <handa@m17n.org>
parents: 29247
diff changeset
7377 void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7378 encode_coding_object (coding, src_object, from, from_byte, to, to_byte,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7379 dst_object)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7380 struct coding_system *coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7381 Lisp_Object src_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7382 EMACS_INT from, from_byte, to, to_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7383 Lisp_Object dst_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7384 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7385 int count = specpdl_ptr - specpdl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7386 EMACS_INT chars = to - from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7387 EMACS_INT bytes = to_byte - from_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7388 Lisp_Object attrs;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7389 int saved_pt = -1, saved_pt_byte;
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7390 int need_marker_adjustment = 0;
90231
8be9e4c6d687 (encode_coding_object): If a pre-write-conversion
Kenichi Handa <handa@m17n.org>
parents: 90224
diff changeset
7391 int kill_src_buffer = 0;
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7392 Lisp_Object old_deactivate_mark;
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7393
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7394 old_deactivate_mark = Vdeactivate_mark;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7395
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7396 coding->src_object = src_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7397 coding->src_chars = chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7398 coding->src_bytes = bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7399 coding->src_multibyte = chars < bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7400
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7401 attrs = CODING_ID_ATTRS (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7402
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7403 if (EQ (src_object, dst_object))
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7404 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7405 struct Lisp_Marker *tail;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7406
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7407 for (tail = BUF_MARKERS (current_buffer); tail; tail = tail->next)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7408 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7409 tail->need_adjustment
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7410 = tail->charpos == (tail->insertion_type ? from : to);
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7411 need_marker_adjustment |= tail->need_adjustment;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7412 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7413 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7414
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7415 if (! NILP (CODING_ATTR_PRE_WRITE (attrs)))
21062
839b22ad1e42 (code_convert_region): Handle the case that codes
Kenichi Handa <handa@m17n.org>
parents: 20999
diff changeset
7416 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7417 coding->src_object = code_conversion_save (1, coding->src_multibyte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7418 set_buffer_internal (XBUFFER (coding->src_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7419 if (STRINGP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7420 insert_from_string (src_object, from, from_byte, chars, bytes, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7421 else if (BUFFERP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7422 insert_from_buffer (XBUFFER (src_object), from, chars, 0);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7423 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7424 insert_1_both (coding->source + from, chars, bytes, 0, 0, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7425
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7426 if (EQ (src_object, dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7427 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7428 set_buffer_internal (XBUFFER (src_object));
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7429 saved_pt = PT, saved_pt_byte = PT_BYTE;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7430 del_range_both (from, from_byte, to, to_byte, 1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7431 set_buffer_internal (XBUFFER (coding->src_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7432 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7433
90131
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7434 {
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7435 Lisp_Object args[3];
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7436 struct gcpro gcpro1, gcpro2, gcpro3, gcpro4, gcpro5;
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7437
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7438 GCPRO5 (coding->src_object, coding->dst_object, src_object, dst_object,
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7439 old_deactivate_mark);
90131
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7440 args[0] = CODING_ATTR_PRE_WRITE (attrs);
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7441 args[1] = make_number (BEG);
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7442 args[2] = make_number (Z);
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7443 safe_call (3, args);
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7444 UNGCPRO;
90131
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7445 }
90231
8be9e4c6d687 (encode_coding_object): If a pre-write-conversion
Kenichi Handa <handa@m17n.org>
parents: 90224
diff changeset
7446 if (XBUFFER (coding->src_object) != current_buffer)
8be9e4c6d687 (encode_coding_object): If a pre-write-conversion
Kenichi Handa <handa@m17n.org>
parents: 90224
diff changeset
7447 kill_src_buffer = 1;
88510
d266b8fb8761 (encode_coding_object): Give correct arguments ot
Kenichi Handa <handa@m17n.org>
parents: 88506
diff changeset
7448 coding->src_object = Fcurrent_buffer ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7449 if (BEG != GPT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7450 move_gap_both (BEG, BEG_BYTE);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7451 coding->src_chars = Z - BEG;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7452 coding->src_bytes = Z_BYTE - BEG_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7453 coding->src_pos = BEG;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7454 coding->src_pos_byte = BEG_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7455 coding->src_multibyte = Z < Z_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7456 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7457 else if (STRINGP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7458 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7459 code_conversion_save (0, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7460 coding->src_pos = from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7461 coding->src_pos_byte = from_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7462 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7463 else if (BUFFERP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7464 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7465 code_conversion_save (0, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7466 set_buffer_internal (XBUFFER (src_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7467 if (EQ (src_object, dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7468 {
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7469 saved_pt = PT, saved_pt_byte = PT_BYTE;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7470 coding->src_object = del_range_1 (from, to, 1, 1);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7471 coding->src_pos = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7472 coding->src_pos_byte = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7473 }
23514
7bad909cd6f1 (setup_coding_system): Fix setting up
Kenichi Handa <handa@m17n.org>
parents: 23475
diff changeset
7474 else
42105
09cc243e2d14 (code_convert_region): Update coding->cmp_data->char_offset
Richard M. Stallman <rms@gnu.org>
parents: 42104
diff changeset
7475 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7476 if (from < GPT && to >= GPT)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7477 move_gap_both (from, from_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7478 coding->src_pos = from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7479 coding->src_pos_byte = from_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7480 }
64308
93129de4b8a4 (code_convert_region_unwind): ARG is changed to a cons.
Kenichi Handa <handa@m17n.org>
parents: 64251
diff changeset
7481 }
93129de4b8a4 (code_convert_region_unwind): ARG is changed to a cons.
Kenichi Handa <handa@m17n.org>
parents: 64251
diff changeset
7482 else
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7483 code_conversion_save (0, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7484
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7485 if (BUFFERP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7486 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7487 coding->dst_object = dst_object;
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
7488 if (EQ (src_object, dst_object))
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
7489 {
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
7490 coding->dst_pos = from;
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
7491 coding->dst_pos_byte = from_byte;
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
7492 }
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
7493 else
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
7494 {
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
7495 struct buffer *current = current_buffer;
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
7496
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
7497 set_buffer_temp (XBUFFER (dst_object));
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
7498 coding->dst_pos = PT;
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
7499 coding->dst_pos_byte = PT_BYTE;
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
7500 move_gap_both (coding->dst_pos, coding->dst_pos_byte);
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
7501 set_buffer_temp (current);
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
7502 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7503 coding->dst_multibyte
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7504 = ! NILP (XBUFFER (dst_object)->enable_multibyte_characters);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7505 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7506 else if (EQ (dst_object, Qt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7507 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7508 coding->dst_object = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7509 coding->dst_bytes = coding->src_chars;
88510
d266b8fb8761 (encode_coding_object): Give correct arguments ot
Kenichi Handa <handa@m17n.org>
parents: 88506
diff changeset
7510 if (coding->dst_bytes == 0)
d266b8fb8761 (encode_coding_object): Give correct arguments ot
Kenichi Handa <handa@m17n.org>
parents: 88506
diff changeset
7511 coding->dst_bytes = 1;
d266b8fb8761 (encode_coding_object): Give correct arguments ot
Kenichi Handa <handa@m17n.org>
parents: 88506
diff changeset
7512 coding->destination = (unsigned char *) xmalloc (coding->dst_bytes);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7513 coding->dst_multibyte = 0;
65506
f376635f5061 (code_convert_region_unwind): Argument format changed.
Kenichi Handa <handa@m17n.org>
parents: 64770
diff changeset
7514 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
7515 else
29172
46ad5a027334 (run_pre_post_conversion_on_str): Set point to the
Kenichi Handa <handa@m17n.org>
parents: 29093
diff changeset
7516 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7517 coding->dst_object = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7518 coding->dst_multibyte = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7519 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7520
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7521 encode_coding (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7522
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7523 if (EQ (dst_object, Qt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7524 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7525 if (BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7526 coding->dst_object = Fbuffer_string ();
23514
7bad909cd6f1 (setup_coding_system): Fix setting up
Kenichi Handa <handa@m17n.org>
parents: 23475
diff changeset
7527 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7528 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7529 coding->dst_object
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7530 = make_unibyte_string ((char *) coding->destination,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7531 coding->produced);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7532 xfree (coding->destination);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7533 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7534 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7535
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7536 if (saved_pt >= 0)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7537 {
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7538 /* This is the case of:
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7539 (BUFFERP (src_object) && EQ (src_object, dst_object))
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7540 As we have moved PT while replacing the original buffer
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7541 contents, we must recover it now. */
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7542 set_buffer_internal (XBUFFER (src_object));
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7543 if (saved_pt < from)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7544 TEMP_SET_PT_BOTH (saved_pt, saved_pt_byte);
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7545 else if (saved_pt < from + chars)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7546 TEMP_SET_PT_BOTH (from, from_byte);
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7547 else if (! NILP (current_buffer->enable_multibyte_characters))
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7548 TEMP_SET_PT_BOTH (saved_pt + (coding->produced_char - chars),
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7549 saved_pt_byte + (coding->produced - bytes));
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7550 else
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7551 TEMP_SET_PT_BOTH (saved_pt + (coding->produced - bytes),
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7552 saved_pt_byte + (coding->produced - bytes));
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7553
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7554 if (need_marker_adjustment)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7555 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7556 struct Lisp_Marker *tail;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7557
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7558 for (tail = BUF_MARKERS (current_buffer); tail; tail = tail->next)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7559 if (tail->need_adjustment)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7560 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7561 tail->need_adjustment = 0;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7562 if (tail->insertion_type)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7563 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7564 tail->bytepos = from_byte;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7565 tail->charpos = from;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7566 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7567 else
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7568 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7569 tail->bytepos = from_byte + coding->produced;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7570 tail->charpos
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7571 = (NILP (current_buffer->enable_multibyte_characters)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7572 ? tail->bytepos : from + coding->produced_char);
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7573 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7574 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7575 }
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7576 }
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7577
90231
8be9e4c6d687 (encode_coding_object): If a pre-write-conversion
Kenichi Handa <handa@m17n.org>
parents: 90224
diff changeset
7578 if (kill_src_buffer)
8be9e4c6d687 (encode_coding_object): If a pre-write-conversion
Kenichi Handa <handa@m17n.org>
parents: 90224
diff changeset
7579 Fkill_buffer (coding->src_object);
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7580
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7581 Vdeactivate_mark = old_deactivate_mark;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7582 unbind_to (count, Qnil);
58637
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
7583 }
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
7584
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
7585
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
7586 Lisp_Object
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7587 preferred_coding_system ()
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7588 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7589 int id = coding_categories[coding_priorities[0]].id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7590
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7591 return CODING_ID_NAME (id);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7592 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7593
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7594
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7595 #ifdef emacs
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
7596 /*** 8. Emacs Lisp library functions ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7597
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7598 DEFUN ("coding-system-p", Fcoding_system_p, Scoding_system_p, 1, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
7599 doc: /* Return t if OBJECT is nil or a coding-system.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7600 See the documentation of `define-coding-system' for information
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
7601 about coding-system objects. */)
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
7602 (object)
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
7603 Lisp_Object object;
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
7604 {
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
7605 if (NILP (object)
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
7606 || CODING_SYSTEM_ID (object) >= 0)
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
7607 return Qt;
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
7608 if (! SYMBOLP (object)
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
7609 || NILP (Fget (object, Qcoding_system_define_form)))
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
7610 return Qnil;
90272
f1df126ec7de Sync to HEAD for handling autoload-coding-system.
Kenichi Handa <handa@m17n.org>
parents: 90263
diff changeset
7611 return Qt;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7612 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7613
17717
4891aaecc5cc (Fread_coding_system, Fread_non_nil_coding_system):
Richard M. Stallman <rms@gnu.org>
parents: 17485
diff changeset
7614 DEFUN ("read-non-nil-coding-system", Fread_non_nil_coding_system,
4891aaecc5cc (Fread_coding_system, Fread_non_nil_coding_system):
Richard M. Stallman <rms@gnu.org>
parents: 17485
diff changeset
7615 Sread_non_nil_coding_system, 1, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
7616 doc: /* Read a coding system from the minibuffer, prompting with string PROMPT. */)
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
7617 (prompt)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7618 Lisp_Object prompt;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7619 {
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
7620 Lisp_Object val;
17717
4891aaecc5cc (Fread_coding_system, Fread_non_nil_coding_system):
Richard M. Stallman <rms@gnu.org>
parents: 17485
diff changeset
7621 do
4891aaecc5cc (Fread_coding_system, Fread_non_nil_coding_system):
Richard M. Stallman <rms@gnu.org>
parents: 17485
diff changeset
7622 {
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
7623 val = Fcompleting_read (prompt, Vcoding_system_alist, Qnil,
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
7624 Qt, Qnil, Qcoding_system_history, Qnil, Qnil);
17717
4891aaecc5cc (Fread_coding_system, Fread_non_nil_coding_system):
Richard M. Stallman <rms@gnu.org>
parents: 17485
diff changeset
7625 }
46370
40db0673e6f0 Most uses of XSTRING combined with STRING_BYTES or indirection changed to
Ken Raeburn <raeburn@raeburn.org>
parents: 46293
diff changeset
7626 while (SCHARS (val) == 0);
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
7627 return (Fintern (val, Qnil));
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7628 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7629
19758
49a1662b68dd (Fread_coding_system): New optional arg DEFAULT_CODING_SYSTEM.
Richard M. Stallman <rms@gnu.org>
parents: 19750
diff changeset
7630 DEFUN ("read-coding-system", Fread_coding_system, Sread_coding_system, 1, 2, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
7631 doc: /* Read a coding system from the minibuffer, prompting with string PROMPT.
79107
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
7632 If the user enters null input, return second argument DEFAULT-CODING-SYSTEM.
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
7633 Ignores case when completing coding systems (all Emacs coding systems
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
7634 are lower-case). */)
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
7635 (prompt, default_coding_system)
19758
49a1662b68dd (Fread_coding_system): New optional arg DEFAULT_CODING_SYSTEM.
Richard M. Stallman <rms@gnu.org>
parents: 19750
diff changeset
7636 Lisp_Object prompt, default_coding_system;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7637 {
19747
bed06df9cbc5 (setup_coding_system, Ffind_operation_coding_system)
Richard M. Stallman <rms@gnu.org>
parents: 19743
diff changeset
7638 Lisp_Object val;
79107
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
7639 int count = SPECPDL_INDEX ();
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
7640
19758
49a1662b68dd (Fread_coding_system): New optional arg DEFAULT_CODING_SYSTEM.
Richard M. Stallman <rms@gnu.org>
parents: 19750
diff changeset
7641 if (SYMBOLP (default_coding_system))
45396
cab845213388 * coding.c (Fread_coding_system, code_convert_region1)
Ken Raeburn <raeburn@raeburn.org>
parents: 45239
diff changeset
7642 default_coding_system = SYMBOL_NAME (default_coding_system);
79107
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
7643 specbind (Qcompletion_ignore_case, Qt);
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
7644 val = Fcompleting_read (prompt, Vcoding_system_alist, Qnil,
19758
49a1662b68dd (Fread_coding_system): New optional arg DEFAULT_CODING_SYSTEM.
Richard M. Stallman <rms@gnu.org>
parents: 19750
diff changeset
7645 Qt, Qnil, Qcoding_system_history,
49a1662b68dd (Fread_coding_system): New optional arg DEFAULT_CODING_SYSTEM.
Richard M. Stallman <rms@gnu.org>
parents: 19750
diff changeset
7646 default_coding_system, Qnil);
79107
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
7647 unbind_to (count, Qnil);
46370
40db0673e6f0 Most uses of XSTRING combined with STRING_BYTES or indirection changed to
Ken Raeburn <raeburn@raeburn.org>
parents: 46293
diff changeset
7648 return (SCHARS (val) == 0 ? Qnil : Fintern (val, Qnil));
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7649 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7650
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7651 DEFUN ("check-coding-system", Fcheck_coding_system, Scheck_coding_system,
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7652 1, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
7653 doc: /* Check validity of CODING-SYSTEM.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
7654 If valid, return CODING-SYSTEM, else signal a `coding-system-error' error.
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
7655 It is valid if it is nil or a symbol defined as a coding system by the
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
7656 function `define-coding-system'. */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7657 (coding_system)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7658 Lisp_Object coding_system;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7659 {
52794
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
7660 Lisp_Object define_form;
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
7661
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
7662 define_form = Fget (coding_system, Qcoding_system_define_form);
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
7663 if (! NILP (define_form))
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
7664 {
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
7665 Fput (coding_system, Qcoding_system_define_form, Qnil);
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
7666 safe_eval (define_form);
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
7667 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7668 if (!NILP (Fcoding_system_p (coding_system)))
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7669 return coding_system;
71972
eaa3c19b94d2 (Fcheck_coding_system): Use xsignal1. Remove loop.
Kim F. Storm <storm@cua.dk>
parents: 71084
diff changeset
7670 xsignal1 (Qcoding_system_error, coding_system);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7671 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7672
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
7673
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7674 /* Detect how the bytes at SRC of length SRC_BYTES are encoded. If
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7675 HIGHEST is nonzero, return the coding system of the highest
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7676 priority among the detected coding systems. Otherwise return a
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7677 list of detected coding systems sorted by their priorities. If
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7678 MULTIBYTEP is nonzero, it is assumed that the bytes are in correct
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7679 multibyte form but contain only ASCII and eight-bit chars.
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7680 Otherwise, the bytes are raw bytes.
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7681
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7682 CODING-SYSTEM controls the detection as below:
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7683
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7684 If it is nil, detect both text-format and eol-format. If the
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7685 text-format part of CODING-SYSTEM is already specified
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7686 (e.g. `iso-latin-1'), detect only eol-format. If the eol-format
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7687 part of CODING-SYSTEM is already specified (e.g. `undecided-unix'),
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7688 detect only text-format. */
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7689
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7690 Lisp_Object
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7691 detect_coding_system (src, src_chars, src_bytes, highest, multibytep,
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7692 coding_system)
46548
cb1914307488 (encode_eol, detect_coding, detect_eol):
Ken Raeburn <raeburn@raeburn.org>
parents: 46462
diff changeset
7693 const unsigned char *src;
91807
507bcfb4342c * coding.c (coding_set_destination): Use BEG_BYTE rather than hardcoding 1.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 91622
diff changeset
7694 EMACS_INT src_chars, src_bytes;
507bcfb4342c * coding.c (coding_set_destination): Use BEG_BYTE rather than hardcoding 1.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 91622
diff changeset
7695 int highest;
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
7696 int multibytep;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7697 Lisp_Object coding_system;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7698 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
7699 const unsigned char *src_end = src + src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7700 Lisp_Object attrs, eol_type;
100135
0e17542db552 (detect_coding_system): Initialize utf_16_le_eol to -1, val to
Kenichi Handa <handa@m17n.org>
parents: 100133
diff changeset
7701 Lisp_Object val = Qnil;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7702 struct coding_system coding;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7703 int id;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7704 struct coding_detection_info detect_info;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7705 enum coding_category base_category;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7706 int null_byte_found = 0, eight_bit_found = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7707
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7708 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7709 coding_system = Qundecided;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7710 setup_coding_system (coding_system, &coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7711 attrs = CODING_ID_ATTRS (coding.id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7712 eol_type = CODING_ID_EOL_TYPE (coding.id);
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7713 coding_system = CODING_ATTR_BASE_NAME (attrs);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7714
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7715 coding.source = src;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7716 coding.src_chars = src_chars;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7717 coding.src_bytes = src_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7718 coding.src_multibyte = multibytep;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7719 coding.consumed = 0;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7720 coding.mode |= CODING_MODE_LAST_BLOCK;
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
7721 coding.head_ascii = 0;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7722
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7723 detect_info.checked = detect_info.found = detect_info.rejected = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7724
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7725 /* At first, detect text-format if necessary. */
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7726 base_category = XINT (CODING_ATTR_CATEGORY (attrs));
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7727 if (base_category == coding_category_undecided)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7728 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7729 enum coding_category category;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7730 struct coding_system *this;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7731 int c, i;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7732
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7733 /* Skip all ASCII bytes except for a few ISO2022 controls. */
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7734 for (; src < src_end; src++)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7735 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7736 c = *src;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
7737 if (c & 0x80)
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7738 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7739 eight_bit_found = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7740 if (null_byte_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7741 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7742 }
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
7743 else if (c < 0x20)
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
7744 {
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7745 if ((c == ISO_CODE_ESC || c == ISO_CODE_SI || c == ISO_CODE_SO)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7746 && ! inhibit_iso_escape_detection
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7747 && ! detect_info.checked)
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
7748 {
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7749 if (detect_coding_iso_2022 (&coding, &detect_info))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7750 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7751 /* We have scanned the whole data. */
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7752 if (! (detect_info.rejected & CATEGORY_MASK_ISO_7_ELSE))
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
7753 {
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
7754 /* We didn't find an 8-bit code. We may
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
7755 have found a null-byte, but it's very
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
7756 rare that a binary file conforms to
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
7757 ISO-2022. */
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
7758 src = src_end;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
7759 coding.head_ascii = src - coding.source;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
7760 }
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
7761 detect_info.rejected |= ~CATEGORY_MASK_ISO_ESCAPE;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7762 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7763 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7764 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7765 else if (! c)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7766 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7767 null_byte_found = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7768 if (eight_bit_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7769 break;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
7770 }
95585
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
7771 if (! eight_bit_found)
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
7772 coding.head_ascii++;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
7773 }
95585
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
7774 else if (! eight_bit_found)
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
7775 coding.head_ascii++;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
7776 }
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7777
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7778 if (null_byte_found || eight_bit_found
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7779 || coding.head_ascii < coding.src_bytes
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
7780 || detect_info.found)
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
7781 {
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7782 if (coding.head_ascii == coding.src_bytes)
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
7783 /* As all bytes are 7-bit, we can ignore non-ISO-2022 codings. */
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
7784 for (i = 0; i < coding_category_raw_text; i++)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7785 {
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
7786 category = coding_priorities[i];
90594
a965377e6761 (detect_coding_system): Fix for handling off
Kenichi Handa <handa@m17n.org>
parents: 90587
diff changeset
7787 this = coding_categories + category;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
7788 if (detect_info.found & (1 << category))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7789 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7790 }
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
7791 else
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7792 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7793 if (null_byte_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7794 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7795 detect_info.checked |= ~CATEGORY_MASK_UTF_16;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7796 detect_info.rejected |= ~CATEGORY_MASK_UTF_16;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7797 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7798 for (i = 0; i < coding_category_raw_text; i++)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7799 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7800 category = coding_priorities[i];
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7801 this = coding_categories + category;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7802
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7803 if (this->id < 0)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7804 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7805 /* No coding system of this category is defined. */
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7806 detect_info.rejected |= (1 << category);
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7807 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7808 else if (category >= coding_category_raw_text)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7809 continue;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7810 else if (detect_info.checked & (1 << category))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7811 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7812 if (highest
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7813 && (detect_info.found & (1 << category)))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7814 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7815 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7816 else if ((*(this->detector)) (&coding, &detect_info)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7817 && highest
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7818 && (detect_info.found & (1 << category)))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7819 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7820 if (category == coding_category_utf_16_auto)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7821 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7822 if (detect_info.found & CATEGORY_MASK_UTF_16_LE)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7823 category = coding_category_utf_16_le;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7824 else
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7825 category = coding_category_utf_16_be;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7826 }
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
7827 break;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7828 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7829 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7830 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7831 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7832
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7833 if ((detect_info.rejected & CATEGORY_MASK_ANY) == CATEGORY_MASK_ANY)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7834 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7835 detect_info.found = CATEGORY_MASK_RAW_TEXT;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7836 id = coding_categories[coding_category_raw_text].id;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7837 val = Fcons (make_number (id), Qnil);
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7838 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7839 else if (! detect_info.rejected && ! detect_info.found)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7840 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7841 detect_info.found = CATEGORY_MASK_ANY;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7842 id = coding_categories[coding_category_undecided].id;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7843 val = Fcons (make_number (id), Qnil);
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7844 }
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7845 else if (highest)
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7846 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7847 if (detect_info.found)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7848 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7849 detect_info.found = 1 << category;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7850 val = Fcons (make_number (this->id), Qnil);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7851 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7852 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7853 for (i = 0; i < coding_category_raw_text; i++)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7854 if (! (detect_info.rejected & (1 << coding_priorities[i])))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7855 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7856 detect_info.found = 1 << coding_priorities[i];
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7857 id = coding_categories[coding_priorities[i]].id;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7858 val = Fcons (make_number (id), Qnil);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7859 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7860 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7861 }
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7862 else
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7863 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7864 int mask = detect_info.rejected | detect_info.found;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7865 int found = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7866
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7867 for (i = coding_category_raw_text - 1; i >= 0; i--)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7868 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7869 category = coding_priorities[i];
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7870 if (! (mask & (1 << category)))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7871 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7872 found |= 1 << category;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7873 id = coding_categories[category].id;
90594
a965377e6761 (detect_coding_system): Fix for handling off
Kenichi Handa <handa@m17n.org>
parents: 90587
diff changeset
7874 if (id >= 0)
a965377e6761 (detect_coding_system): Fix for handling off
Kenichi Handa <handa@m17n.org>
parents: 90587
diff changeset
7875 val = Fcons (make_number (id), val);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7876 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7877 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7878 for (i = coding_category_raw_text - 1; i >= 0; i--)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7879 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7880 category = coding_priorities[i];
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7881 if (detect_info.found & (1 << category))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7882 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7883 id = coding_categories[category].id;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7884 val = Fcons (make_number (id), val);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7885 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7886 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7887 detect_info.found |= found;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7888 }
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7889 }
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
7890 else if (base_category == coding_category_utf_8_auto)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
7891 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
7892 if (detect_coding_utf_8 (&coding, &detect_info))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
7893 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
7894 struct coding_system *this;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
7895
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
7896 if (detect_info.found & CATEGORY_MASK_UTF_8_SIG)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
7897 this = coding_categories + coding_category_utf_8_sig;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
7898 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
7899 this = coding_categories + coding_category_utf_8_nosig;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
7900 val = Fcons (make_number (this->id), Qnil);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
7901 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
7902 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7903 else if (base_category == coding_category_utf_16_auto)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7904 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7905 if (detect_coding_utf_16 (&coding, &detect_info))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7906 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7907 struct coding_system *this;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7908
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7909 if (detect_info.found & CATEGORY_MASK_UTF_16_LE)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7910 this = coding_categories + coding_category_utf_16_le;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7911 else if (detect_info.found & CATEGORY_MASK_UTF_16_BE)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7912 this = coding_categories + coding_category_utf_16_be;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7913 else if (detect_info.rejected & CATEGORY_MASK_UTF_16_LE_NOSIG)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7914 this = coding_categories + coding_category_utf_16_be_nosig;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7915 else
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7916 this = coding_categories + coding_category_utf_16_le_nosig;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7917 val = Fcons (make_number (this->id), Qnil);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7918 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7919 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7920 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7921 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7922 detect_info.found = 1 << XINT (CODING_ATTR_CATEGORY (attrs));
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7923 val = Fcons (make_number (coding.id), Qnil);
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7924 }
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7925
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7926 /* Then, detect eol-format if necessary. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7927 {
100135
0e17542db552 (detect_coding_system): Initialize utf_16_le_eol to -1, val to
Kenichi Handa <handa@m17n.org>
parents: 100133
diff changeset
7928 int normal_eol = -1, utf_16_be_eol = -1, utf_16_le_eol = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7929 Lisp_Object tail;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7930
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7931 if (VECTORP (eol_type))
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7932 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7933 if (detect_info.found & ~CATEGORY_MASK_UTF_16)
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7934 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7935 if (null_byte_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7936 normal_eol = EOL_SEEN_LF;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7937 else
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7938 normal_eol = detect_eol (coding.source, src_bytes,
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7939 coding_category_raw_text);
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
7940 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7941 if (detect_info.found & (CATEGORY_MASK_UTF_16_BE
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7942 | CATEGORY_MASK_UTF_16_BE_NOSIG))
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7943 utf_16_be_eol = detect_eol (coding.source, src_bytes,
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7944 coding_category_utf_16_be);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7945 if (detect_info.found & (CATEGORY_MASK_UTF_16_LE
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7946 | CATEGORY_MASK_UTF_16_LE_NOSIG))
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7947 utf_16_le_eol = detect_eol (coding.source, src_bytes,
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7948 coding_category_utf_16_le);
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7949 }
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7950 else
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7951 {
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7952 if (EQ (eol_type, Qunix))
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7953 normal_eol = utf_16_be_eol = utf_16_le_eol = EOL_SEEN_LF;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7954 else if (EQ (eol_type, Qdos))
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7955 normal_eol = utf_16_be_eol = utf_16_le_eol = EOL_SEEN_CRLF;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7956 else
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7957 normal_eol = utf_16_be_eol = utf_16_le_eol = EOL_SEEN_CR;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7958 }
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7959
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7960 for (tail = val; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7961 {
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7962 enum coding_category category;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7963 int this_eol;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7964
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7965 id = XINT (XCAR (tail));
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7966 attrs = CODING_ID_ATTRS (id);
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7967 category = XINT (CODING_ATTR_CATEGORY (attrs));
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7968 eol_type = CODING_ID_EOL_TYPE (id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7969 if (VECTORP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7970 {
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7971 if (category == coding_category_utf_16_be
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7972 || category == coding_category_utf_16_be_nosig)
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7973 this_eol = utf_16_be_eol;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7974 else if (category == coding_category_utf_16_le
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7975 || category == coding_category_utf_16_le_nosig)
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7976 this_eol = utf_16_le_eol;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7977 else
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7978 this_eol = normal_eol;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7979
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7980 if (this_eol == EOL_SEEN_LF)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7981 XSETCAR (tail, AREF (eol_type, 0));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7982 else if (this_eol == EOL_SEEN_CRLF)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7983 XSETCAR (tail, AREF (eol_type, 1));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7984 else if (this_eol == EOL_SEEN_CR)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7985 XSETCAR (tail, AREF (eol_type, 2));
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7986 else
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7987 XSETCAR (tail, CODING_ID_NAME (id));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7988 }
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7989 else
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
7990 XSETCAR (tail, CODING_ID_NAME (id));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7991 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7992 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7993
100135
0e17542db552 (detect_coding_system): Initialize utf_16_le_eol to -1, val to
Kenichi Handa <handa@m17n.org>
parents: 100133
diff changeset
7994 return (highest ? (CONSP (val) ? XCAR (val) : Qnil) : val);
42104
d69c2368e549 (DECODE_COMPOSITION_END): Fixed a typo in the last
Sam Steingold <sds@gnu.org>
parents: 42103
diff changeset
7995 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7996
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7997
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7998 DEFUN ("detect-coding-region", Fdetect_coding_region, Sdetect_coding_region,
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7999 2, 3, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8000 doc: /* Detect coding system of the text in the region between START and END.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8001 Return a list of possible coding systems ordered by priority.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8002
72552
6493d4697ad2 (Fdetect_coding_region, Fdetect_coding_string): Fix
Kenichi Handa <handa@m17n.org>
parents: 72395
diff changeset
8003 If only ASCII characters are found (except for such ISO-2022 control
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8004 characters as ESC), it returns a list of single element `undecided'
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8005 or its subsidiary coding system according to a detected end-of-line
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8006 format.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8007
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8008 If optional argument HIGHEST is non-nil, return the coding system of
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8009 highest priority. */)
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8010 (start, end, highest)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8011 Lisp_Object start, end, highest;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8012 {
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8013 int from, to;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8014 int from_byte, to_byte;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8015
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8016 CHECK_NUMBER_COERCE_MARKER (start);
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8017 CHECK_NUMBER_COERCE_MARKER (end);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8018
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8019 validate_region (&start, &end);
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8020 from = XINT (start), to = XINT (end);
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8021 from_byte = CHAR_TO_BYTE (from);
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8022 to_byte = CHAR_TO_BYTE (to);
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8023
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8024 if (from < GPT && to >= GPT)
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8025 move_gap_both (to, to_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8026
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8027 return detect_coding_system (BYTE_POS_ADDR (from_byte),
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8028 to - from, to_byte - from_byte,
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
8029 !NILP (highest),
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
8030 !NILP (current_buffer
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8031 ->enable_multibyte_characters),
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8032 Qnil);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8033 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8034
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8035 DEFUN ("detect-coding-string", Fdetect_coding_string, Sdetect_coding_string,
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8036 1, 2, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8037 doc: /* Detect coding system of the text in STRING.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8038 Return a list of possible coding systems ordered by priority.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8039
72552
6493d4697ad2 (Fdetect_coding_region, Fdetect_coding_string): Fix
Kenichi Handa <handa@m17n.org>
parents: 72395
diff changeset
8040 If only ASCII characters are found (except for such ISO-2022 control
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8041 characters as ESC), it returns a list of single element `undecided'
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8042 or its subsidiary coding system according to a detected end-of-line
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8043 format.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8044
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8045 If optional argument HIGHEST is non-nil, return the coding system of
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8046 highest priority. */)
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8047 (string, highest)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8048 Lisp_Object string, highest;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8049 {
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8050 CHECK_STRING (string);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8051
46370
40db0673e6f0 Most uses of XSTRING combined with STRING_BYTES or indirection changed to
Ken Raeburn <raeburn@raeburn.org>
parents: 46293
diff changeset
8052 return detect_coding_system (SDATA (string),
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8053 SCHARS (string), SBYTES (string),
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8054 !NILP (highest), STRING_MULTIBYTE (string),
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8055 Qnil);
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8056 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8057
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8058
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8059 static INLINE int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8060 char_encodable_p (c, attrs)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8061 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8062 Lisp_Object attrs;
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8063 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8064 Lisp_Object tail;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8065 struct charset *charset;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8066 Lisp_Object translation_table;
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8067
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8068 translation_table = CODING_ATTR_TRANS_TBL (attrs);
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
8069 if (! NILP (translation_table))
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8070 c = translate_char (translation_table, c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8071 for (tail = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8072 CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8073 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8074 charset = CHARSET_FROM_ID (XINT (XCAR (tail)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8075 if (CHAR_CHARSET_P (c, charset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8076 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8077 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8078 return (! NILP (tail));
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8079 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8080
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8081
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8082 /* Return a list of coding systems that safely encode the text between
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8083 START and END. If EXCLUDE is non-nil, it is a list of coding
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8084 systems not to check. The returned list doesn't contain any such
88889
4548f224c603 (Ffind_coding_systems_region_internal): Detect an
Kenichi Handa <handa@m17n.org>
parents: 88876
diff changeset
8085 coding systems. In any case, if the text contains only ASCII or is
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8086 unibyte, return t. */
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8087
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8088 DEFUN ("find-coding-systems-region-internal",
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8089 Ffind_coding_systems_region_internal,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8090 Sfind_coding_systems_region_internal, 2, 3, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8091 doc: /* Internal use only. */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8092 (start, end, exclude)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8093 Lisp_Object start, end, exclude;
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8094 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8095 Lisp_Object coding_attrs_list, safe_codings;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8096 EMACS_INT start_byte, end_byte;
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
8097 const unsigned char *p, *pbeg, *pend;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8098 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8099 Lisp_Object tail, elt;
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8100
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8101 if (STRINGP (start))
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8102 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8103 if (!STRING_MULTIBYTE (start)
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8104 || SCHARS (start) == SBYTES (start))
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8105 return Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8106 start_byte = 0;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8107 end_byte = SBYTES (start);
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8108 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8109 else
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8110 {
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8111 CHECK_NUMBER_COERCE_MARKER (start);
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8112 CHECK_NUMBER_COERCE_MARKER (end);
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8113 if (XINT (start) < BEG || XINT (end) > Z || XINT (start) > XINT (end))
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8114 args_out_of_range (start, end);
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8115 if (NILP (current_buffer->enable_multibyte_characters))
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8116 return Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8117 start_byte = CHAR_TO_BYTE (XINT (start));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8118 end_byte = CHAR_TO_BYTE (XINT (end));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8119 if (XINT (end) - XINT (start) == end_byte - start_byte)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8120 return Qt;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8121
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8122 if (XINT (start) < GPT && XINT (end) > GPT)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8123 {
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8124 if ((GPT - XINT (start)) < (XINT (end) - GPT))
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8125 move_gap_both (XINT (start), start_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8126 else
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8127 move_gap_both (XINT (end), end_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8128 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8129 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8130
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8131 coding_attrs_list = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8132 for (tail = Vcoding_system_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8133 if (NILP (exclude)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8134 || NILP (Fmemq (XCAR (tail), exclude)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8135 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8136 Lisp_Object attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8137
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8138 attrs = AREF (CODING_SYSTEM_SPEC (XCAR (tail)), 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8139 if (EQ (XCAR (tail), CODING_ATTR_BASE_NAME (attrs))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8140 && ! EQ (CODING_ATTR_TYPE (attrs), Qundecided))
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8141 {
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8142 ASET (attrs, coding_attr_trans_tbl,
89861
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
8143 get_translation_table (attrs, 1, NULL));
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8144 coding_attrs_list = Fcons (attrs, coding_attrs_list);
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8145 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8146 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8147
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8148 if (STRINGP (start))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8149 p = pbeg = SDATA (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8150 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8151 p = pbeg = BYTE_POS_ADDR (start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8152 pend = p + (end_byte - start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8153
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8154 while (p < pend && ASCII_BYTE_P (*p)) p++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8155 while (p < pend && ASCII_BYTE_P (*(pend - 1))) pend--;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8156
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8157 while (p < pend)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8158 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8159 if (ASCII_BYTE_P (*p))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8160 p++;
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8161 else
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8162 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8163 c = STRING_CHAR_ADVANCE (p);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8164
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8165 charset_map_loaded = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8166 for (tail = coding_attrs_list; CONSP (tail);)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8167 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8168 elt = XCAR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8169 if (NILP (elt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8170 tail = XCDR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8171 else if (char_encodable_p (c, elt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8172 tail = XCDR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8173 else if (CONSP (XCDR (tail)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8174 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8175 XSETCAR (tail, XCAR (XCDR (tail)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8176 XSETCDR (tail, XCDR (XCDR (tail)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8177 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8178 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8179 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8180 XSETCAR (tail, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8181 tail = XCDR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8182 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8183 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8184 if (charset_map_loaded)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8185 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8186 EMACS_INT p_offset = p - pbeg, pend_offset = pend - pbeg;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8187
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8188 if (STRINGP (start))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8189 pbeg = SDATA (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8190 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8191 pbeg = BYTE_POS_ADDR (start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8192 p = pbeg + p_offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8193 pend = pbeg + pend_offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8194 }
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8195 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8196 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8197
89905
37e044cc35f6 (Ffind_coding_systems_region_internal): Include raw-text and
Kenichi Handa <handa@m17n.org>
parents: 89892
diff changeset
8198 safe_codings = list2 (Qraw_text, Qno_conversion);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8199 for (tail = coding_attrs_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8200 if (! NILP (XCAR (tail)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8201 safe_codings = Fcons (CODING_ATTR_BASE_NAME (XCAR (tail)), safe_codings);
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
8202
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
8203 return safe_codings;
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
8204 }
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
8205
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
8206
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8207 DEFUN ("unencodable-char-position", Funencodable_char_position,
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8208 Sunencodable_char_position, 3, 5, 0,
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8209 doc: /*
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8210 Return position of first un-encodable character in a region.
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8211 START and END specify the region and CODING-SYSTEM specifies the
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8212 encoding to check. Return nil if CODING-SYSTEM does encode the region.
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8213
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8214 If optional 4th argument COUNT is non-nil, it specifies at most how
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8215 many un-encodable characters to search. In this case, the value is a
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8216 list of positions.
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8217
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8218 If optional 5th argument STRING is non-nil, it is a string to search
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8219 for un-encodable characters. In that case, START and END are indexes
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8220 to the string. */)
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8221 (start, end, coding_system, count, string)
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8222 Lisp_Object start, end, coding_system, count, string;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8223 {
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8224 int n;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8225 struct coding_system coding;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8226 Lisp_Object attrs, charset_list, translation_table;
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8227 Lisp_Object positions;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8228 int from, to;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8229 const unsigned char *p, *stop, *pend;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8230 int ascii_compatible;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8231
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8232 setup_coding_system (Fcheck_coding_system (coding_system), &coding);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8233 attrs = CODING_ID_ATTRS (coding.id);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8234 if (EQ (CODING_ATTR_TYPE (attrs), Qraw_text))
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8235 return Qnil;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8236 ascii_compatible = ! NILP (CODING_ATTR_ASCII_COMPAT (attrs));
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8237 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
89861
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
8238 translation_table = get_translation_table (attrs, 1, NULL);
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8239
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8240 if (NILP (string))
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8241 {
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8242 validate_region (&start, &end);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8243 from = XINT (start);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8244 to = XINT (end);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8245 if (NILP (current_buffer->enable_multibyte_characters)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8246 || (ascii_compatible
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8247 && (to - from) == (CHAR_TO_BYTE (to) - (CHAR_TO_BYTE (from)))))
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8248 return Qnil;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8249 p = CHAR_POS_ADDR (from);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8250 pend = CHAR_POS_ADDR (to);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8251 if (from < GPT && to >= GPT)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8252 stop = GPT_ADDR;
48829
f6c59ca557c7 (Funencodable_char_position): Set pend correctly.
Kenichi Handa <handa@m17n.org>
parents: 48230
diff changeset
8253 else
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8254 stop = pend;
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8255 }
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8256 else
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8257 {
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8258 CHECK_STRING (string);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8259 CHECK_NATNUM (start);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8260 CHECK_NATNUM (end);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8261 from = XINT (start);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8262 to = XINT (end);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8263 if (from > to
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8264 || to > SCHARS (string))
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8265 args_out_of_range_3 (string, start, end);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8266 if (! STRING_MULTIBYTE (string))
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8267 return Qnil;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8268 p = SDATA (string) + string_char_to_byte (string, from);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8269 stop = pend = SDATA (string) + string_char_to_byte (string, to);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8270 if (ascii_compatible && (to - from) == (pend - p))
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8271 return Qnil;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8272 }
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8273
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8274 if (NILP (count))
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8275 n = 1;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8276 else
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8277 {
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8278 CHECK_NATNUM (count);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8279 n = XINT (count);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8280 }
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8281
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8282 positions = Qnil;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8283 while (1)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8284 {
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8285 int c;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8286
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8287 if (ascii_compatible)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8288 while (p < stop && ASCII_BYTE_P (*p))
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8289 p++, from++;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8290 if (p >= stop)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8291 {
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8292 if (p >= pend)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8293 break;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8294 stop = pend;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8295 p = GAP_END_ADDR;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8296 }
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8297
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8298 c = STRING_CHAR_ADVANCE (p);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8299 if (! (ASCII_CHAR_P (c) && ascii_compatible)
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8300 && ! char_charset (translate_char (translation_table, c),
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8301 charset_list, NULL))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8302 {
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8303 positions = Fcons (make_number (from), positions);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8304 n--;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8305 if (n == 0)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8306 break;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8307 }
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8308
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8309 from++;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8310 }
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8311
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8312 return (NILP (count) ? Fcar (positions) : Fnreverse (positions));
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8313 }
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8314
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8315
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8316 DEFUN ("check-coding-systems-region", Fcheck_coding_systems_region,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8317 Scheck_coding_systems_region, 3, 3, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8318 doc: /* Check if the region is encodable by coding systems.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8319
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8320 START and END are buffer positions specifying the region.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8321 CODING-SYSTEM-LIST is a list of coding systems to check.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8322
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8323 The value is an alist ((CODING-SYSTEM POS0 POS1 ...) ...), where
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8324 CODING-SYSTEM is a member of CODING-SYSTEM-LIST and can't encode the
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8325 whole region, POS0, POS1, ... are buffer positions where non-encodable
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8326 characters are found.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8327
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8328 If all coding systems in CODING-SYSTEM-LIST can encode the region, the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8329 value is nil.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8330
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8331 START may be a string. In that case, check if the string is
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8332 encodable, and the value contains indices to the string instead of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8333 buffer positions. END is ignored. */)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8334 (start, end, coding_system_list)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8335 Lisp_Object start, end, coding_system_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8336 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8337 Lisp_Object list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8338 EMACS_INT start_byte, end_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8339 int pos;
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
8340 const unsigned char *p, *pbeg, *pend;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8341 int c;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8342 Lisp_Object tail, elt, attrs;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8343
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8344 if (STRINGP (start))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8345 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8346 if (!STRING_MULTIBYTE (start)
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8347 && SCHARS (start) != SBYTES (start))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8348 return Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8349 start_byte = 0;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8350 end_byte = SBYTES (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8351 pos = 0;
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8352 }
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8353 else
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8354 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8355 CHECK_NUMBER_COERCE_MARKER (start);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8356 CHECK_NUMBER_COERCE_MARKER (end);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8357 if (XINT (start) < BEG || XINT (end) > Z || XINT (start) > XINT (end))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8358 args_out_of_range (start, end);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8359 if (NILP (current_buffer->enable_multibyte_characters))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8360 return Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8361 start_byte = CHAR_TO_BYTE (XINT (start));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8362 end_byte = CHAR_TO_BYTE (XINT (end));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8363 if (XINT (end) - XINT (start) == end_byte - start_byte)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8364 return Qt;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8365
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8366 if (XINT (start) < GPT && XINT (end) > GPT)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8367 {
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8368 if ((GPT - XINT (start)) < (XINT (end) - GPT))
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8369 move_gap_both (XINT (start), start_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8370 else
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8371 move_gap_both (XINT (end), end_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8372 }
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8373 pos = XINT (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8374 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8375
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8376 list = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8377 for (tail = coding_system_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8378 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8379 elt = XCAR (tail);
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8380 attrs = AREF (CODING_SYSTEM_SPEC (elt), 0);
89861
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
8381 ASET (attrs, coding_attr_trans_tbl,
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
8382 get_translation_table (attrs, 1, NULL));
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8383 list = Fcons (Fcons (elt, Fcons (attrs, Qnil)), list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8384 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8385
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8386 if (STRINGP (start))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8387 p = pbeg = SDATA (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8388 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8389 p = pbeg = BYTE_POS_ADDR (start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8390 pend = p + (end_byte - start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8391
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8392 while (p < pend && ASCII_BYTE_P (*p)) p++, pos++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8393 while (p < pend && ASCII_BYTE_P (*(pend - 1))) pend--;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8394
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8395 while (p < pend)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8396 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8397 if (ASCII_BYTE_P (*p))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8398 p++;
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8399 else
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8400 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8401 c = STRING_CHAR_ADVANCE (p);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8402
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8403 charset_map_loaded = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8404 for (tail = list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8405 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8406 elt = XCDR (XCAR (tail));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8407 if (! char_encodable_p (c, XCAR (elt)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8408 XSETCDR (elt, Fcons (make_number (pos), XCDR (elt)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8409 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8410 if (charset_map_loaded)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8411 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8412 EMACS_INT p_offset = p - pbeg, pend_offset = pend - pbeg;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8413
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8414 if (STRINGP (start))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8415 pbeg = SDATA (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8416 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8417 pbeg = BYTE_POS_ADDR (start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8418 p = pbeg + p_offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8419 pend = pbeg + pend_offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8420 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8421 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8422 pos++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8423 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8424
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8425 tail = list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8426 list = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8427 for (; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8428 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8429 elt = XCAR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8430 if (CONSP (XCDR (XCDR (elt))))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8431 list = Fcons (Fcons (XCAR (elt), Fnreverse (XCDR (XCDR (elt)))),
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8432 list);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8433 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8434
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8435 return list;
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8436 }
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8437
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8438
20803
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
8439 Lisp_Object
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8440 code_convert_region (start, end, coding_system, dst_object, encodep, norecord)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8441 Lisp_Object start, end, coding_system, dst_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8442 int encodep, norecord;
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8443 {
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8444 struct coding_system coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8445 EMACS_INT from, from_byte, to, to_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8446 Lisp_Object src_object;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8447
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8448 CHECK_NUMBER_COERCE_MARKER (start);
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8449 CHECK_NUMBER_COERCE_MARKER (end);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8450 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8451 coding_system = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8452 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8453 CHECK_CODING_SYSTEM (coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8454 src_object = Fcurrent_buffer ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8455 if (NILP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8456 dst_object = src_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8457 else if (! EQ (dst_object, Qt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8458 CHECK_BUFFER (dst_object);
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8459
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8460 validate_region (&start, &end);
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8461 from = XFASTINT (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8462 from_byte = CHAR_TO_BYTE (from);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8463 to = XFASTINT (end);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8464 to_byte = CHAR_TO_BYTE (to);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8465
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8466 setup_coding_system (coding_system, &coding);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8467 coding.mode |= CODING_MODE_LAST_BLOCK;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8468
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8469 if (encodep)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8470 encode_coding_object (&coding, src_object, from, from_byte, to, to_byte,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8471 dst_object);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8472 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8473 decode_coding_object (&coding, src_object, from, from_byte, to, to_byte,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8474 dst_object);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8475 if (! norecord)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8476 Vlast_coding_system_used = CODING_ID_NAME (coding.id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8477
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8478 return (BUFFERP (dst_object)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8479 ? make_number (coding.produced_char)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8480 : coding.dst_object);
20803
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
8481 }
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
8482
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
8483
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
8484 DEFUN ("decode-coding-region", Fdecode_coding_region, Sdecode_coding_region,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8485 3, 4, "r\nzCoding system: ",
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8486 doc: /* Decode the current region from the specified coding system.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8487 When called from a program, takes four arguments:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8488 START, END, CODING-SYSTEM, and DESTINATION.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8489 START and END are buffer positions.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8490
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8491 Optional 4th argument DESTINATION specifies where the decoded text goes.
91083
ff87badce376 (Fdecode_coding_region): Fix typo in docstring.
Kenichi Handa <handa@m17n.org>
parents: 91056
diff changeset
8492 If nil, the region between START and END is replaced by the decoded text.
98992
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
8493 If a buffer, the decoded text is inserted in that buffer after point (point
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
8494 does not move).
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
8495 In those cases, the length of the decoded text is returned.
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8496 If DESTINATION is t, the decoded text is returned.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8497
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8498 This function sets `last-coding-system-used' to the precise coding system
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8499 used (which may be different from CODING-SYSTEM if CODING-SYSTEM is
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8500 not fully specified.) */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8501 (start, end, coding_system, destination)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8502 Lisp_Object start, end, coding_system, destination;
20803
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
8503 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8504 return code_convert_region (start, end, coding_system, destination, 0, 0);
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8505 }
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8506
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8507 DEFUN ("encode-coding-region", Fencode_coding_region, Sencode_coding_region,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8508 3, 4, "r\nzCoding system: ",
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8509 doc: /* Encode the current region using the specified coding system.
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8510 When called from a program, takes four arguments:
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8511 START, END, CODING-SYSTEM and DESTINATION.
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8512 START and END are buffer positions.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8513
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8514 Optional 4th argument DESTINATION specifies where the encoded text goes.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8515 If nil, the region between START and END is replaced by the encoded text.
98992
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
8516 If a buffer, the encoded text is inserted in that buffer after point (point
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
8517 does not move).
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
8518 In those cases, the length of the encoded text is returned.
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8519 If DESTINATION is t, the encoded text is returned.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8520
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8521 This function sets `last-coding-system-used' to the precise coding system
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8522 used (which may be different from CODING-SYSTEM if CODING-SYSTEM is
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8523 not fully specified.) */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8524 (start, end, coding_system, destination)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8525 Lisp_Object start, end, coding_system, destination;
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8526 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8527 return code_convert_region (start, end, coding_system, destination, 1, 0);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8528 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8529
20803
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
8530 Lisp_Object
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8531 code_convert_string (string, coding_system, dst_object,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8532 encodep, nocopy, norecord)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8533 Lisp_Object string, coding_system, dst_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8534 int encodep, nocopy, norecord;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8535 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8536 struct coding_system coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8537 EMACS_INT chars, bytes;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8538
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8539 CHECK_STRING (string);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8540 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8541 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8542 if (! norecord)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8543 Vlast_coding_system_used = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8544 if (NILP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8545 return (nocopy ? Fcopy_sequence (string) : string);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8546 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8547
70520
b6740a317343 (setup_coding_system): For invalid coding-system, set
Kenichi Handa <handa@m17n.org>
parents: 69995
diff changeset
8548 if (NILP (coding_system))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8549 coding_system = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8550 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8551 CHECK_CODING_SYSTEM (coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8552 if (NILP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8553 dst_object = Qt;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8554 else if (! EQ (dst_object, Qt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8555 CHECK_BUFFER (dst_object);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8556
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8557 setup_coding_system (coding_system, &coding);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8558 coding.mode |= CODING_MODE_LAST_BLOCK;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8559 chars = SCHARS (string);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8560 bytes = SBYTES (string);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8561 if (encodep)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8562 encode_coding_object (&coding, string, 0, 0, chars, bytes, dst_object);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8563 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8564 decode_coding_object (&coding, string, 0, 0, chars, bytes, dst_object);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8565 if (! norecord)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8566 Vlast_coding_system_used = CODING_ID_NAME (coding.id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8567
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8568 return (BUFFERP (dst_object)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8569 ? make_number (coding.produced_char)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8570 : coding.dst_object);
20803
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
8571 }
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
8572
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
8573
22341
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
8574 /* Encode or decode STRING according to CODING_SYSTEM.
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
8575 Do not set Vlast_coding_system_used.
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
8576
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
8577 This function is called only from macros DECODE_FILE and
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
8578 ENCODE_FILE, thus we ignore character composition. */
22341
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
8579
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
8580 Lisp_Object
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
8581 code_convert_string_norecord (string, coding_system, encodep)
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
8582 Lisp_Object string, coding_system;
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
8583 int encodep;
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
8584 {
88430
6418a272b97e * coding.c: Delete unused variables.
Kenichi Handa <handa@m17n.org>
parents: 88365
diff changeset
8585 return code_convert_string (string, coding_system, Qt, encodep, 0, 1);
22341
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
8586 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8587
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8588
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8589 DEFUN ("decode-coding-string", Fdecode_coding_string, Sdecode_coding_string,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8590 2, 4, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8591 doc: /* Decode STRING which is encoded in CODING-SYSTEM, and return the result.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8592
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8593 Optional third arg NOCOPY non-nil means it is OK to return STRING itself
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8594 if the decoding operation is trivial.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8595
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8596 Optional fourth arg BUFFER non-nil means that the decoded text is
98992
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
8597 inserted in that buffer after point (point does not move). In this
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
8598 case, the return value is the length of the decoded text.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8599
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8600 This function sets `last-coding-system-used' to the precise coding system
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8601 used (which may be different from CODING-SYSTEM if CODING-SYSTEM is
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8602 not fully specified.) */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8603 (string, coding_system, nocopy, buffer)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8604 Lisp_Object string, coding_system, nocopy, buffer;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8605 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8606 return code_convert_string (string, coding_system, buffer,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8607 0, ! NILP (nocopy), 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8608 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8609
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8610 DEFUN ("encode-coding-string", Fencode_coding_string, Sencode_coding_string,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8611 2, 4, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8612 doc: /* Encode STRING to CODING-SYSTEM, and return the result.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8613
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8614 Optional third arg NOCOPY non-nil means it is OK to return STRING
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8615 itself if the encoding operation is trivial.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8616
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8617 Optional fourth arg BUFFER non-nil means that the encoded text is
98992
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
8618 inserted in that buffer after point (point does not move). In this
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
8619 case, the return value is the length of the encoded text.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8620
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8621 This function sets `last-coding-system-used' to the precise coding system
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8622 used (which may be different from CODING-SYSTEM if CODING-SYSTEM is
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8623 not fully specified.) */)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8624 (string, coding_system, nocopy, buffer)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8625 Lisp_Object string, coding_system, nocopy, buffer;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8626 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8627 return code_convert_string (string, coding_system, buffer,
88856
13a375bc220d (ENCODE_DESIGNATION, decode_eol)
Dave Love <fx@gnu.org>
parents: 88845
diff changeset
8628 1, ! NILP (nocopy), 1);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8629 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8630
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8631
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8632 DEFUN ("decode-sjis-char", Fdecode_sjis_char, Sdecode_sjis_char, 1, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8633 doc: /* Decode a Japanese character which has CODE in shift_jis encoding.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8634 Return the corresponding character. */)
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8635 (code)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8636 Lisp_Object code;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8637 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8638 Lisp_Object spec, attrs, val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8639 struct charset *charset_roman, *charset_kanji, *charset_kana, *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8640 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8641
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8642 CHECK_NATNUM (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8643 c = XFASTINT (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8644 CHECK_CODING_SYSTEM_GET_SPEC (Vsjis_coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8645 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8646
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8647 if (ASCII_BYTE_P (c)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8648 && ! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8649 return code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8650
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8651 val = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8652 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
88497
d2b9e0d4c2f6 (Fdecode_sjis_char): Fix typo (0x7F->0xFF). Fix the
Kenichi Handa <handa@m17n.org>
parents: 88485
diff changeset
8653 charset_kana = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
d2b9e0d4c2f6 (Fdecode_sjis_char): Fix typo (0x7F->0xFF). Fix the
Kenichi Handa <handa@m17n.org>
parents: 88485
diff changeset
8654 charset_kanji = CHARSET_FROM_ID (XINT (XCAR (val)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8655
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8656 if (c <= 0x7F)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8657 charset = charset_roman;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8658 else if (c >= 0xA0 && c < 0xDF)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8659 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8660 charset = charset_kana;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8661 c -= 0x80;
24065
7e291dea6141 (Fdecode_sjis_char): Decode Japanese Katakana character
Kenichi Handa <handa@m17n.org>
parents: 24056
diff changeset
8662 }
7e291dea6141 (Fdecode_sjis_char): Decode Japanese Katakana character
Kenichi Handa <handa@m17n.org>
parents: 24056
diff changeset
8663 else
7e291dea6141 (Fdecode_sjis_char): Decode Japanese Katakana character
Kenichi Handa <handa@m17n.org>
parents: 24056
diff changeset
8664 {
88497
d2b9e0d4c2f6 (Fdecode_sjis_char): Fix typo (0x7F->0xFF). Fix the
Kenichi Handa <handa@m17n.org>
parents: 88485
diff changeset
8665 int s1 = c >> 8, s2 = c & 0xFF;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8666
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8667 if (s1 < 0x81 || (s1 > 0x9F && s1 < 0xE0) || s1 > 0xEF
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8668 || s2 < 0x40 || s2 == 0x7F || s2 > 0xFC)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8669 error ("Invalid code: %d", code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8670 SJIS_TO_JIS (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8671 charset = charset_kanji;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8672 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8673 c = DECODE_CHAR (charset, c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8674 if (c < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8675 error ("Invalid code: %d", code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8676 return make_number (c);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8677 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8678
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8679
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8680 DEFUN ("encode-sjis-char", Fencode_sjis_char, Sencode_sjis_char, 1, 1, 0,
73949
0d1207b43a5b (Fencode_sjis_char, Fencode_big5_char): Improve argument/docstring consistency.
Juanma Barranquero <lekktu@gmail.com>
parents: 72552
diff changeset
8681 doc: /* Encode a Japanese character CH to shift_jis encoding.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8682 Return the corresponding code in SJIS. */)
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8683 (ch)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8684 Lisp_Object ch;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8685 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8686 Lisp_Object spec, attrs, charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8687 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8688 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8689 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8690
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8691 CHECK_CHARACTER (ch);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8692 c = XFASTINT (ch);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8693 CHECK_CODING_SYSTEM_GET_SPEC (Vsjis_coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8694 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8695
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8696 if (ASCII_CHAR_P (c)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8697 && ! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8698 return ch;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8699
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8700 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8701 charset = char_charset (c, charset_list, &code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8702 if (code == CHARSET_INVALID_CODE (charset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8703 error ("Can't encode by shift_jis encoding: %d", c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8704 JIS_TO_SJIS (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8705
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8706 return make_number (code);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8707 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8708
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8709 DEFUN ("decode-big5-char", Fdecode_big5_char, Sdecode_big5_char, 1, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8710 doc: /* Decode a Big5 character which has CODE in BIG5 coding system.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8711 Return the corresponding character. */)
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8712 (code)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8713 Lisp_Object code;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8714 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8715 Lisp_Object spec, attrs, val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8716 struct charset *charset_roman, *charset_big5, *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8717 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8718
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8719 CHECK_NATNUM (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8720 c = XFASTINT (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8721 CHECK_CODING_SYSTEM_GET_SPEC (Vbig5_coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8722 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8723
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8724 if (ASCII_BYTE_P (c)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8725 && ! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8726 return code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8727
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8728 val = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8729 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8730 charset_big5 = CHARSET_FROM_ID (XINT (XCAR (val)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8731
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8732 if (c <= 0x7F)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8733 charset = charset_roman;
24324
2eec590faf26 (Fdecode_sjis_char, Fencode_sjis_char): Hanlde
Kenichi Handa <handa@m17n.org>
parents: 24316
diff changeset
8734 else
2eec590faf26 (Fdecode_sjis_char, Fencode_sjis_char): Hanlde
Kenichi Handa <handa@m17n.org>
parents: 24316
diff changeset
8735 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8736 int b1 = c >> 8, b2 = c & 0x7F;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8737 if (b1 < 0xA1 || b1 > 0xFE
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8738 || b2 < 0x40 || (b2 > 0x7E && b2 < 0xA1) || b2 > 0xFE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8739 error ("Invalid code: %d", code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8740 charset = charset_big5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8741 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8742 c = DECODE_CHAR (charset, (unsigned )c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8743 if (c < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8744 error ("Invalid code: %d", code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8745 return make_number (c);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8746 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8747
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8748 DEFUN ("encode-big5-char", Fencode_big5_char, Sencode_big5_char, 1, 1, 0,
73949
0d1207b43a5b (Fencode_sjis_char, Fencode_big5_char): Improve argument/docstring consistency.
Juanma Barranquero <lekktu@gmail.com>
parents: 72552
diff changeset
8749 doc: /* Encode the Big5 character CH to BIG5 coding system.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8750 Return the corresponding character code in Big5. */)
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8751 (ch)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8752 Lisp_Object ch;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8753 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8754 Lisp_Object spec, attrs, charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8755 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8756 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8757 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8758
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8759 CHECK_CHARACTER (ch);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8760 c = XFASTINT (ch);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8761 CHECK_CODING_SYSTEM_GET_SPEC (Vbig5_coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8762 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8763 if (ASCII_CHAR_P (c)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8764 && ! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8765 return ch;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8766
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8767 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8768 charset = char_charset (c, charset_list, &code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8769 if (code == CHARSET_INVALID_CODE (charset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8770 error ("Can't encode by Big5 encoding: %d", c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8771
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8772 return make_number (code);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8773 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8774
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8775
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
8776 DEFUN ("set-terminal-coding-system-internal", Fset_terminal_coding_system_internal,
83298
ed09a89e2b25 Fix UTF-8 tty input when first frame is an X frame. Steps towards multiple tty locale support.
Karoly Lorentey <lorentey@elte.hu>
parents: 83292
diff changeset
8777 Sset_terminal_coding_system_internal, 1, 2, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8778 doc: /* Internal use only. */)
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
8779 (coding_system, terminal)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8780 Lisp_Object coding_system;
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
8781 Lisp_Object terminal;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8782 {
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
8783 struct coding_system *terminal_coding = TERMINAL_TERMINAL_CODING (get_terminal (terminal, 1));
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8784 CHECK_SYMBOL (coding_system);
83127
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
8785 setup_coding_system (Fcheck_coding_system (coding_system), terminal_coding);
20150
402b6e5f4b58 (encode_designation_at_bol): Fix bug of finding graphic
Kenichi Handa <handa@m17n.org>
parents: 20105
diff changeset
8786 /* We had better not send unsafe characters to terminal. */
91041
bdb3fe0ba9fa Merge from emacs--devo--0
Miles Bader <miles@gnu.org>
parents: 90996 84646
diff changeset
8787 terminal_coding->mode |= CODING_MODE_SAFE_ENCODING;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8788 /* Character composition should be disabled. */
91041
bdb3fe0ba9fa Merge from emacs--devo--0
Miles Bader <miles@gnu.org>
parents: 90996 84646
diff changeset
8789 terminal_coding->common_flags &= ~CODING_ANNOTATE_COMPOSITION_MASK;
83127
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
8790 terminal_coding->src_multibyte = 1;
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
8791 terminal_coding->dst_multibyte = 0;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8792 return Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8793 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8794
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
8795 DEFUN ("set-safe-terminal-coding-system-internal",
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
8796 Fset_safe_terminal_coding_system_internal,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8797 Sset_safe_terminal_coding_system_internal, 1, 1, 0,
41006
fd83ec62a495 Doc fix.
Pavel Janík <Pavel@Janik.cz>
parents: 40842
diff changeset
8798 doc: /* Internal use only. */)
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8799 (coding_system)
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
8800 Lisp_Object coding_system;
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
8801 {
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8802 CHECK_SYMBOL (coding_system);
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
8803 setup_coding_system (Fcheck_coding_system (coding_system),
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
8804 &safe_terminal_coding);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8805 /* Character composition should be disabled. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8806 safe_terminal_coding.common_flags &= ~CODING_ANNOTATE_COMPOSITION_MASK;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
8807 safe_terminal_coding.src_multibyte = 1;
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
8808 safe_terminal_coding.dst_multibyte = 0;
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
8809 return Qnil;
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
8810 }
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
8811
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
8812 DEFUN ("terminal-coding-system", Fterminal_coding_system,
83298
ed09a89e2b25 Fix UTF-8 tty input when first frame is an X frame. Steps towards multiple tty locale support.
Karoly Lorentey <lorentey@elte.hu>
parents: 83292
diff changeset
8813 Sterminal_coding_system, 0, 1, 0,
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
8814 doc: /* Return coding system specified for terminal output on the given terminal.
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
8815 TERMINAL may be a terminal id, a frame, or nil for the selected
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
8816 frame's terminal device. */)
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
8817 (terminal)
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
8818 Lisp_Object terminal;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8819 {
91046
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
8820 struct coding_system *terminal_coding
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
8821 = TERMINAL_TERMINAL_CODING (get_terminal (terminal, 1));
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
8822 Lisp_Object coding_system = CODING_ID_NAME (terminal_coding->id);
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
8823
90011
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
8824 /* For backward compatibility, return nil if it is `undecided'. */
90359
041f75914d0c (produce_composition): Compare charbuf[i] instead of
Kenichi Handa <handa@m17n.org>
parents: 90354
diff changeset
8825 return (! EQ (coding_system, Qundecided) ? coding_system : Qnil);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8826 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8827
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
8828 DEFUN ("set-keyboard-coding-system-internal", Fset_keyboard_coding_system_internal,
83298
ed09a89e2b25 Fix UTF-8 tty input when first frame is an X frame. Steps towards multiple tty locale support.
Karoly Lorentey <lorentey@elte.hu>
parents: 83292
diff changeset
8829 Sset_keyboard_coding_system_internal, 1, 2, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8830 doc: /* Internal use only. */)
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
8831 (coding_system, terminal)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8832 Lisp_Object coding_system;
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
8833 Lisp_Object terminal;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8834 {
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
8835 struct terminal *t = get_terminal (terminal, 1);
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8836 CHECK_SYMBOL (coding_system);
83127
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
8837 setup_coding_system (Fcheck_coding_system (coding_system),
91041
bdb3fe0ba9fa Merge from emacs--devo--0
Miles Bader <miles@gnu.org>
parents: 90996 84646
diff changeset
8838 TERMINAL_KEYBOARD_CODING (t));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8839 /* Character composition should be disabled. */
91041
bdb3fe0ba9fa Merge from emacs--devo--0
Miles Bader <miles@gnu.org>
parents: 90996 84646
diff changeset
8840 TERMINAL_KEYBOARD_CODING (t)->common_flags
bdb3fe0ba9fa Merge from emacs--devo--0
Miles Bader <miles@gnu.org>
parents: 90996 84646
diff changeset
8841 &= ~CODING_ANNOTATE_COMPOSITION_MASK;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8842 return Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8843 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8844
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8845 DEFUN ("keyboard-coding-system",
91046
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
8846 Fkeyboard_coding_system, Skeyboard_coding_system, 0, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8847 doc: /* Return coding system specified for decoding keyboard input. */)
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
8848 (terminal)
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
8849 Lisp_Object terminal;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8850 {
91046
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
8851 return CODING_ID_NAME (TERMINAL_KEYBOARD_CODING
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
8852 (get_terminal (terminal, 1))->id);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8853 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8854
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8855
18536
69c0e220b626 (Vstandard_character_unification_table_for_decode):
Kenichi Handa <handa@m17n.org>
parents: 18523
diff changeset
8856 DEFUN ("find-operation-coding-system", Ffind_operation_coding_system,
69c0e220b626 (Vstandard_character_unification_table_for_decode):
Kenichi Handa <handa@m17n.org>
parents: 18523
diff changeset
8857 Sfind_operation_coding_system, 1, MANY, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8858 doc: /* Choose a coding system for an operation based on the target name.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8859 The value names a pair of coding systems: (DECODING-SYSTEM . ENCODING-SYSTEM).
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8860 DECODING-SYSTEM is the coding system to use for decoding
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8861 \(in case OPERATION does decoding), and ENCODING-SYSTEM is the coding system
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8862 for encoding (in case OPERATION does encoding).
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8863
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8864 The first argument OPERATION specifies an I/O primitive:
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8865 For file I/O, `insert-file-contents' or `write-region'.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8866 For process I/O, `call-process', `call-process-region', or `start-process'.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8867 For network I/O, `open-network-stream'.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8868
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8869 The remaining arguments should be the same arguments that were passed
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8870 to the primitive. Depending on which primitive, one of those arguments
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8871 is selected as the TARGET. For example, if OPERATION does file I/O,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8872 whichever argument specifies the file name is TARGET.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8873
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8874 TARGET has a meaning which depends on OPERATION:
70948
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
8875 For file I/O, TARGET is a file name (except for the special case below).
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8876 For process I/O, TARGET is a process name.
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8877 For network I/O, TARGET is a service name or a port number.
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8878
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8879 This function looks up what is specified for TARGET in
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8880 `file-coding-system-alist', `process-coding-system-alist',
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8881 or `network-coding-system-alist' depending on OPERATION.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8882 They may specify a coding system, a cons of coding systems,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8883 or a function symbol to call.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8884 In the last case, we call the function with one argument,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8885 which is a list of all the arguments given to this function.
81611
ae42ad5f89e6 (Ffind_operation_coding_system): Docstring improved.
Kenichi Handa <handa@m17n.org>
parents: 75348
diff changeset
8886 If the function can't decide a coding system, it can return
ae42ad5f89e6 (Ffind_operation_coding_system): Docstring improved.
Kenichi Handa <handa@m17n.org>
parents: 75348
diff changeset
8887 `undecided' so that the normal code-detection is performed.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8888
70948
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
8889 If OPERATION is `insert-file-contents', the argument corresponding to
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
8890 TARGET may be a cons (FILENAME . BUFFER). In that case, FILENAME is a
71084
ccef92f2f7f8 (Ffind_operation_coding_system): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents: 71070
diff changeset
8891 file name to look up, and BUFFER is a buffer that contains the file's
ccef92f2f7f8 (Ffind_operation_coding_system): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents: 71070
diff changeset
8892 contents (not yet decoded). If `file-coding-system-alist' specifies a
71070
0c8ac7192244 (Ffind_operation_coding_system): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents: 71039
diff changeset
8893 function to call for FILENAME, that function should examine the
0c8ac7192244 (Ffind_operation_coding_system): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents: 71039
diff changeset
8894 contents of BUFFER instead of reading the file.
70948
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
8895
78152
5e5f359984e5 (Ffind_operation_coding_system): Doc fix.
Juanma Barranquero <lekktu@gmail.com>
parents: 75348
diff changeset
8896 usage: (find-operation-coding-system OPERATION ARGUMENTS...) */)
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8897 (nargs, args)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8898 int nargs;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8899 Lisp_Object *args;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8900 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8901 Lisp_Object operation, target_idx, target, val;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8902 register Lisp_Object chain;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8903
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8904 if (nargs < 2)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8905 error ("Too few arguments");
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8906 operation = args[0];
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8907 if (!SYMBOLP (operation)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8908 || !INTEGERP (target_idx = Fget (operation, Qtarget_idx)))
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
8909 error ("Invalid first argument");
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8910 if (nargs < 1 + XINT (target_idx))
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8911 error ("Too few arguments for operation: %s",
46370
40db0673e6f0 Most uses of XSTRING combined with STRING_BYTES or indirection changed to
Ken Raeburn <raeburn@raeburn.org>
parents: 46293
diff changeset
8912 SDATA (SYMBOL_NAME (operation)));
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8913 target = args[XINT (target_idx) + 1];
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8914 if (!(STRINGP (target)
70948
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
8915 || (EQ (operation, Qinsert_file_contents) && CONSP (target)
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
8916 && STRINGP (XCAR (target)) && BUFFERP (XCDR (target)))
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8917 || (EQ (operation, Qopen_network_stream) && INTEGERP (target))))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8918 error ("Invalid %dth argument", XINT (target_idx) + 1);
70948
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
8919 if (CONSP (target))
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
8920 target = XCAR (target);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8921
18613
614b916ff5bf Fix bugs with inappropriate mixing of Lisp_Object with int.
Richard M. Stallman <rms@gnu.org>
parents: 18536
diff changeset
8922 chain = ((EQ (operation, Qinsert_file_contents)
614b916ff5bf Fix bugs with inappropriate mixing of Lisp_Object with int.
Richard M. Stallman <rms@gnu.org>
parents: 18536
diff changeset
8923 || EQ (operation, Qwrite_region))
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
8924 ? Vfile_coding_system_alist
18613
614b916ff5bf Fix bugs with inappropriate mixing of Lisp_Object with int.
Richard M. Stallman <rms@gnu.org>
parents: 18536
diff changeset
8925 : (EQ (operation, Qopen_network_stream)
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
8926 ? Vnetwork_coding_system_alist
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
8927 : Vprocess_coding_system_alist));
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8928 if (NILP (chain))
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8929 return Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8930
25662
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
8931 for (; CONSP (chain); chain = XCDR (chain))
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8932 {
19747
bed06df9cbc5 (setup_coding_system, Ffind_operation_coding_system)
Richard M. Stallman <rms@gnu.org>
parents: 19743
diff changeset
8933 Lisp_Object elt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8934
25662
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
8935 elt = XCAR (chain);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8936 if (CONSP (elt)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8937 && ((STRINGP (target)
25662
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
8938 && STRINGP (XCAR (elt))
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
8939 && fast_string_match (XCAR (elt), target) >= 0)
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
8940 || (INTEGERP (target) && EQ (target, XCAR (elt)))))
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
8941 {
25662
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
8942 val = XCDR (elt);
19763
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
8943 /* Here, if VAL is both a valid coding system and a valid
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
8944 function symbol, we return VAL as a coding system. */
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
8945 if (CONSP (val))
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
8946 return val;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
8947 if (! SYMBOLP (val))
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
8948 return Qnil;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
8949 if (! NILP (Fcoding_system_p (val)))
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
8950 return Fcons (val, val);
19763
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
8951 if (! NILP (Ffboundp (val)))
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
8952 {
72188
6100ca974994 Comment change.
Richard M. Stallman <rms@gnu.org>
parents: 72180
diff changeset
8953 /* We use call1 rather than safe_call1
6100ca974994 Comment change.
Richard M. Stallman <rms@gnu.org>
parents: 72180
diff changeset
8954 so as to get bug reports about functions called here
6100ca974994 Comment change.
Richard M. Stallman <rms@gnu.org>
parents: 72180
diff changeset
8955 which don't handle the current interface. */
72180
f3bc55b96df5 (Ffind_operation_coding_system): Revert the change from 2006-05-29.
Eli Zaretskii <eliz@gnu.org>
parents: 71972
diff changeset
8956 val = call1 (val, Flist (nargs, args));
19763
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
8957 if (CONSP (val))
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
8958 return val;
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
8959 if (SYMBOLP (val) && ! NILP (Fcoding_system_p (val)))
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
8960 return Fcons (val, val);
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
8961 }
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
8962 return Qnil;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
8963 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8964 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8965 return Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8966 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8967
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8968 DEFUN ("set-coding-system-priority", Fset_coding_system_priority,
88845
64b8f6168269 (Fset_coding_system_priority): Allow null arg list.
Dave Love <fx@gnu.org>
parents: 88771
diff changeset
8969 Sset_coding_system_priority, 0, MANY, 0,
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
8970 doc: /* Assign higher priority to the coding systems given as arguments.
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8971 If multiple coding systems belong to the same category,
89519
040a08a2a879 (Fread_coding_system): Fix arg of XSETSTRING.
Dave Love <fx@gnu.org>
parents: 89483
diff changeset
8972 all but the first one are ignored.
040a08a2a879 (Fread_coding_system): Fix arg of XSETSTRING.
Dave Love <fx@gnu.org>
parents: 89483
diff changeset
8973
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8974 usage: (set-coding-system-priority &rest coding-systems) */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8975 (nargs, args)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8976 int nargs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8977 Lisp_Object *args;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8978 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8979 int i, j;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8980 int changed[coding_category_max];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8981 enum coding_category priorities[coding_category_max];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8982
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8983 bzero (changed, sizeof changed);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8984
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8985 for (i = j = 0; i < nargs; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8986 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8987 enum coding_category category;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8988 Lisp_Object spec, attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8989
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8990 CHECK_CODING_SYSTEM_GET_SPEC (args[i], spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8991 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8992 category = XINT (CODING_ATTR_CATEGORY (attrs));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8993 if (changed[category])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8994 /* Ignore this coding system because a coding system of the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8995 same category already had a higher priority. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8996 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8997 changed[category] = 1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8998 priorities[j++] = category;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8999 if (coding_categories[category].id >= 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9000 && ! EQ (args[i], CODING_ID_NAME (coding_categories[category].id)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9001 setup_coding_system (args[i], &coding_categories[category]);
89467
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9002 Fset (AREF (Vcoding_category_table, category), args[i]);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9003 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9004
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9005 /* Now we have decided top J priorities. Reflect the order of the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9006 original priorities to the remaining priorities. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9007
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9008 for (i = j, j = 0; i < coding_category_max; i++, j++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9009 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9010 while (j < coding_category_max
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9011 && changed[coding_priorities[j]])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9012 j++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9013 if (j == coding_category_max)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9014 abort ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9015 priorities[i] = coding_priorities[j];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9016 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9017
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9018 bcopy (priorities, coding_priorities, sizeof priorities);
89467
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9019
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9020 /* Update `coding-category-list'. */
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9021 Vcoding_category_list = Qnil;
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9022 for (i = coding_category_max - 1; i >= 0; i--)
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9023 Vcoding_category_list
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9024 = Fcons (AREF (Vcoding_category_table, priorities[i]),
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9025 Vcoding_category_list);
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
9026
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9027 return Qnil;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9028 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9029
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9030 DEFUN ("coding-system-priority-list", Fcoding_system_priority_list,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9031 Scoding_system_priority_list, 0, 1, 0,
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
9032 doc: /* Return a list of coding systems ordered by their priorities.
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
9033 HIGHESTP non-nil means just return the highest priority one. */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9034 (highestp)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9035 Lisp_Object highestp;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9036 {
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9037 int i;
22954
928b337d953b Avoid using initializers for Lisp_Object.
Richard M. Stallman <rms@gnu.org>
parents: 22874
diff changeset
9038 Lisp_Object val;
928b337d953b Avoid using initializers for Lisp_Object.
Richard M. Stallman <rms@gnu.org>
parents: 22874
diff changeset
9039
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9040 for (i = 0, val = Qnil; i < coding_category_max; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9041 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9042 enum coding_category category = coding_priorities[i];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9043 int id = coding_categories[category].id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9044 Lisp_Object attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9045
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9046 if (id < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9047 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9048 attrs = CODING_ID_ATTRS (id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9049 if (! NILP (highestp))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9050 return CODING_ATTR_BASE_NAME (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9051 val = Fcons (CODING_ATTR_BASE_NAME (attrs), val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9052 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9053 return Fnreverse (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9054 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9055
88631
780b91d4a7e5 (setup_iso_safe_charsets): Fix arg decl for K&R.
Dave Love <fx@gnu.org>
parents: 88607
diff changeset
9056 static char *suffixes[] = { "-unix", "-dos", "-mac" };
780b91d4a7e5 (setup_iso_safe_charsets): Fix arg decl for K&R.
Dave Love <fx@gnu.org>
parents: 88607
diff changeset
9057
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9058 static Lisp_Object
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9059 make_subsidiaries (base)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9060 Lisp_Object base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9061 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9062 Lisp_Object subsidiaries;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9063 int base_name_len = SBYTES (SYMBOL_NAME (base));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9064 char *buf = (char *) alloca (base_name_len + 6);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9065 int i;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9066
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9067 bcopy (SDATA (SYMBOL_NAME (base)), buf, base_name_len);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9068 subsidiaries = Fmake_vector (make_number (3), Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9069 for (i = 0; i < 3; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9070 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9071 bcopy (suffixes[i], buf + base_name_len, strlen (suffixes[i]) + 1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9072 ASET (subsidiaries, i, intern (buf));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9073 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9074 return subsidiaries;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9075 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9076
22226
557fac086b1b (ascii_skip_code): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22186
diff changeset
9077
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
9078 DEFUN ("define-coding-system-internal", Fdefine_coding_system_internal,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9079 Sdefine_coding_system_internal, coding_arg_max, MANY, 0,
88544
f464d728344c (Vchar_coding_system_table, Qchar_coding_system):
Dave Love <fx@gnu.org>
parents: 88510
diff changeset
9080 doc: /* For internal use only.
f464d728344c (Vchar_coding_system_table, Qchar_coding_system):
Dave Love <fx@gnu.org>
parents: 88510
diff changeset
9081 usage: (define-coding-system-internal ...) */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9082 (nargs, args)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9083 int nargs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9084 Lisp_Object *args;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9085 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9086 Lisp_Object name;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9087 Lisp_Object spec_vec; /* [ ATTRS ALIASE EOL_TYPE ] */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9088 Lisp_Object attrs; /* Vector of attributes. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9089 Lisp_Object eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9090 Lisp_Object aliases;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9091 Lisp_Object coding_type, charset_list, safe_charsets;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9092 enum coding_category category;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9093 Lisp_Object tail, val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9094 int max_charset_id = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9095 int i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9096
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9097 if (nargs < coding_arg_max)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9098 goto short_args;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9099
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9100 attrs = Fmake_vector (make_number (coding_attr_last_index), Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9101
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9102 name = args[coding_arg_name];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9103 CHECK_SYMBOL (name);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9104 CODING_ATTR_BASE_NAME (attrs) = name;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9105
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9106 val = args[coding_arg_mnemonic];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9107 if (! STRINGP (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9108 CHECK_CHARACTER (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9109 CODING_ATTR_MNEMONIC (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9110
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9111 coding_type = args[coding_arg_coding_type];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9112 CHECK_SYMBOL (coding_type);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9113 CODING_ATTR_TYPE (attrs) = coding_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9114
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9115 charset_list = args[coding_arg_charset_list];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9116 if (SYMBOLP (charset_list))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9117 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9118 if (EQ (charset_list, Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9119 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9120 if (! EQ (coding_type, Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9121 error ("Invalid charset-list");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9122 charset_list = Viso_2022_charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9123 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9124 else if (EQ (charset_list, Qemacs_mule))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9125 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9126 if (! EQ (coding_type, Qemacs_mule))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9127 error ("Invalid charset-list");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9128 charset_list = Vemacs_mule_charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9129 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9130 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9131 if (max_charset_id < XFASTINT (XCAR (tail)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9132 max_charset_id = XFASTINT (XCAR (tail));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9133 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9134 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9135 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9136 charset_list = Fcopy_sequence (charset_list);
91046
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9137 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9138 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9139 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9140
91046
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9141 val = XCAR (tail);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9142 CHECK_CHARSET_GET_CHARSET (val, charset);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9143 if (EQ (coding_type, Qiso_2022)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9144 ? CHARSET_ISO_FINAL (charset) < 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9145 : EQ (coding_type, Qemacs_mule)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9146 ? CHARSET_EMACS_MULE_ID (charset) < 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9147 : 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9148 error ("Can't handle charset `%s'",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9149 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9150
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9151 XSETCAR (tail, make_number (charset->id));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9152 if (max_charset_id < charset->id)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9153 max_charset_id = charset->id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9154 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9155 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9156 CODING_ATTR_CHARSET_LIST (attrs) = charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9157
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9158 safe_charsets = Fmake_string (make_number (max_charset_id + 1),
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9159 make_number (255));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9160 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9161 SSET (safe_charsets, XFASTINT (XCAR (tail)), 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9162 CODING_ATTR_SAFE_CHARSETS (attrs) = safe_charsets;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9163
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9164 CODING_ATTR_ASCII_COMPAT (attrs) = args[coding_arg_ascii_compatible_p];
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9165
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9166 val = args[coding_arg_decode_translation_table];
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9167 if (! CHAR_TABLE_P (val) && ! CONSP (val))
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
9168 CHECK_SYMBOL (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9169 CODING_ATTR_DECODE_TBL (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9170
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9171 val = args[coding_arg_encode_translation_table];
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9172 if (! CHAR_TABLE_P (val) && ! CONSP (val))
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
9173 CHECK_SYMBOL (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9174 CODING_ATTR_ENCODE_TBL (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9175
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9176 val = args[coding_arg_post_read_conversion];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9177 CHECK_SYMBOL (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9178 CODING_ATTR_POST_READ (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9179
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9180 val = args[coding_arg_pre_write_conversion];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9181 CHECK_SYMBOL (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9182 CODING_ATTR_PRE_WRITE (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9183
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9184 val = args[coding_arg_default_char];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9185 if (NILP (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9186 CODING_ATTR_DEFAULT_CHAR (attrs) = make_number (' ');
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9187 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9188 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9189 CHECK_CHARACTER (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9190 CODING_ATTR_DEFAULT_CHAR (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9191 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9192
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9193 val = args[coding_arg_for_unibyte];
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9194 CODING_ATTR_FOR_UNIBYTE (attrs) = NILP (val) ? Qnil : Qt;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9195
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9196 val = args[coding_arg_plist];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9197 CHECK_LIST (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9198 CODING_ATTR_PLIST (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9199
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9200 if (EQ (coding_type, Qcharset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9201 {
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9202 /* Generate a lisp vector of 256 elements. Each element is nil,
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9203 integer, or a list of charset IDs.
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9204
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9205 If Nth element is nil, the byte code N is invalid in this
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9206 coding system.
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9207
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9208 If Nth element is a number NUM, N is the first byte of a
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9209 charset whose ID is NUM.
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9210
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9211 If Nth element is a list of charset IDs, N is the first byte
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9212 of one of them. The list is sorted by dimensions of the
89648
d5641a606e08 (Fdefine_coding_system_internal): Fix checking of ascii compatibility.
Kenichi Handa <handa@m17n.org>
parents: 89644
diff changeset
9213 charsets. A charset of smaller dimension comes first. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9214 val = Fmake_vector (make_number (256), Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9215
89653
cbaa9fd1aa5c (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89648
diff changeset
9216 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9217 {
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9218 struct charset *charset = CHARSET_FROM_ID (XFASTINT (XCAR (tail)));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9219 int dim = CHARSET_DIMENSION (charset);
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9220 int idx = (dim - 1) * 4;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9221
89653
cbaa9fd1aa5c (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89648
diff changeset
9222 if (CHARSET_ASCII_COMPATIBLE_P (charset))
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9223 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9224
88477
5f974cbba7b3 (coding_set_source): Delete the local variable beg_byte.
Kenichi Handa <handa@m17n.org>
parents: 88473
diff changeset
9225 for (i = charset->code_space[idx];
5f974cbba7b3 (coding_set_source): Delete the local variable beg_byte.
Kenichi Handa <handa@m17n.org>
parents: 88473
diff changeset
9226 i <= charset->code_space[idx + 1]; i++)
5f974cbba7b3 (coding_set_source): Delete the local variable beg_byte.
Kenichi Handa <handa@m17n.org>
parents: 88473
diff changeset
9227 {
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9228 Lisp_Object tmp, tmp2;
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9229 int dim2;
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9230
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9231 tmp = AREF (val, i);
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9232 if (NILP (tmp))
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9233 tmp = XCAR (tail);
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9234 else if (NUMBERP (tmp))
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9235 {
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9236 dim2 = CHARSET_DIMENSION (CHARSET_FROM_ID (XFASTINT (tmp)));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9237 if (dim < dim2)
88607
18436bf3d6dd (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88598
diff changeset
9238 tmp = Fcons (XCAR (tail), Fcons (tmp, Qnil));
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9239 else
88607
18436bf3d6dd (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88598
diff changeset
9240 tmp = Fcons (tmp, Fcons (XCAR (tail), Qnil));
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9241 }
88477
5f974cbba7b3 (coding_set_source): Delete the local variable beg_byte.
Kenichi Handa <handa@m17n.org>
parents: 88473
diff changeset
9242 else
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9243 {
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9244 for (tmp2 = tmp; CONSP (tmp2); tmp2 = XCDR (tmp2))
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9245 {
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9246 dim2 = CHARSET_DIMENSION (CHARSET_FROM_ID (XFASTINT (XCAR (tmp2))));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9247 if (dim < dim2)
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9248 break;
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9249 }
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9250 if (NILP (tmp2))
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9251 tmp = nconc2 (tmp, Fcons (XCAR (tail), Qnil));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9252 else
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9253 {
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9254 XSETCDR (tmp2, Fcons (XCAR (tmp2), XCDR (tmp2)));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9255 XSETCAR (tmp2, XCAR (tail));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9256 }
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9257 }
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9258 ASET (val, i, tmp);
88477
5f974cbba7b3 (coding_set_source): Delete the local variable beg_byte.
Kenichi Handa <handa@m17n.org>
parents: 88473
diff changeset
9259 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9260 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9261 ASET (attrs, coding_attr_charset_valids, val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9262 category = coding_category_charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9263 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9264 else if (EQ (coding_type, Qccl))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9265 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9266 Lisp_Object valids;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9267
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9268 if (nargs < coding_arg_ccl_max)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9269 goto short_args;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9270
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9271 val = args[coding_arg_ccl_decoder];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9272 CHECK_CCL_PROGRAM (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9273 if (VECTORP (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9274 val = Fcopy_sequence (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9275 ASET (attrs, coding_attr_ccl_decoder, val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9276
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9277 val = args[coding_arg_ccl_encoder];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9278 CHECK_CCL_PROGRAM (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9279 if (VECTORP (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9280 val = Fcopy_sequence (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9281 ASET (attrs, coding_attr_ccl_encoder, val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9282
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9283 val = args[coding_arg_ccl_valids];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9284 valids = Fmake_string (make_number (256), make_number (0));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9285 for (tail = val; !NILP (tail); tail = Fcdr (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9286 {
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9287 int from, to;
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9288
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9289 val = Fcar (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9290 if (INTEGERP (val))
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9291 {
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9292 from = to = XINT (val);
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9293 if (from < 0 || from > 255)
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9294 args_out_of_range_3 (val, make_number (0), make_number (255));
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9295 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9296 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9297 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9298 CHECK_CONS (val);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9299 CHECK_NATNUM_CAR (val);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9300 CHECK_NATNUM_CDR (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9301 from = XINT (XCAR (val));
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9302 if (from > 255)
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9303 args_out_of_range_3 (XCAR (val),
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9304 make_number (0), make_number (255));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9305 to = XINT (XCDR (val));
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9306 if (to < from || to > 255)
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9307 args_out_of_range_3 (XCDR (val),
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9308 XCAR (val), make_number (255));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9309 }
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9310 for (i = from; i <= to; i++)
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9311 SSET (valids, i, 1);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9312 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9313 ASET (attrs, coding_attr_ccl_valids, valids);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9314
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9315 category = coding_category_ccl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9316 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9317 else if (EQ (coding_type, Qutf_16))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9318 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9319 Lisp_Object bom, endian;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9320
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9321 CODING_ATTR_ASCII_COMPAT (attrs) = Qnil;
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9322
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9323 if (nargs < coding_arg_utf16_max)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9324 goto short_args;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9325
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9326 bom = args[coding_arg_utf16_bom];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9327 if (! NILP (bom) && ! EQ (bom, Qt))
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
9328 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9329 CHECK_CONS (bom);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9330 val = XCAR (bom);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9331 CHECK_CODING_SYSTEM (val);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9332 val = XCDR (bom);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9333 CHECK_CODING_SYSTEM (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9334 }
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9335 ASET (attrs, coding_attr_utf_bom, bom);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9336
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9337 endian = args[coding_arg_utf16_endian];
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9338 CHECK_SYMBOL (endian);
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9339 if (NILP (endian))
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9340 endian = Qbig;
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9341 else if (! EQ (endian, Qbig) && ! EQ (endian, Qlittle))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9342 error ("Invalid endian: %s", SDATA (SYMBOL_NAME (endian)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9343 ASET (attrs, coding_attr_utf_16_endian, endian);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9344
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9345 category = (CONSP (bom)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9346 ? coding_category_utf_16_auto
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9347 : NILP (bom)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9348 ? (EQ (endian, Qbig)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9349 ? coding_category_utf_16_be_nosig
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9350 : coding_category_utf_16_le_nosig)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9351 : (EQ (endian, Qbig)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9352 ? coding_category_utf_16_be
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9353 : coding_category_utf_16_le));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9354 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9355 else if (EQ (coding_type, Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9356 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9357 Lisp_Object initial, reg_usage, request, flags;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
9358 int i;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9359
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9360 if (nargs < coding_arg_iso2022_max)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9361 goto short_args;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9362
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9363 initial = Fcopy_sequence (args[coding_arg_iso2022_initial]);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9364 CHECK_VECTOR (initial);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9365 for (i = 0; i < 4; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9366 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9367 val = Faref (initial, make_number (i));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9368 if (! NILP (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9369 {
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9370 struct charset *charset;
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9371
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9372 CHECK_CHARSET_GET_CHARSET (val, charset);
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9373 ASET (initial, i, make_number (CHARSET_ID (charset)));
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9374 if (i == 0 && CHARSET_ASCII_COMPATIBLE_P (charset))
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9375 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9376 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9377 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9378 ASET (initial, i, make_number (-1));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9379 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9380
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9381 reg_usage = args[coding_arg_iso2022_reg_usage];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9382 CHECK_CONS (reg_usage);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9383 CHECK_NUMBER_CAR (reg_usage);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9384 CHECK_NUMBER_CDR (reg_usage);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9385
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9386 request = Fcopy_sequence (args[coding_arg_iso2022_request]);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9387 for (tail = request; ! NILP (tail); tail = Fcdr (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9388 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9389 int id;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9390 Lisp_Object tmp;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9391
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9392 val = Fcar (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9393 CHECK_CONS (val);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9394 tmp = XCAR (val);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9395 CHECK_CHARSET_GET_ID (tmp, id);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9396 CHECK_NATNUM_CDR (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9397 if (XINT (XCDR (val)) >= 4)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9398 error ("Invalid graphic register number: %d", XINT (XCDR (val)));
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9399 XSETCAR (val, make_number (id));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9400 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9401
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9402 flags = args[coding_arg_iso2022_flags];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9403 CHECK_NATNUM (flags);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9404 i = XINT (flags);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9405 if (EQ (args[coding_arg_charset_list], Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9406 flags = make_number (i | CODING_ISO_FLAG_FULL_SUPPORT);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9407
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9408 ASET (attrs, coding_attr_iso_initial, initial);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9409 ASET (attrs, coding_attr_iso_usage, reg_usage);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9410 ASET (attrs, coding_attr_iso_request, request);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9411 ASET (attrs, coding_attr_iso_flags, flags);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9412 setup_iso_safe_charsets (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9413
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9414 if (i & CODING_ISO_FLAG_SEVEN_BITS)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9415 category = ((i & (CODING_ISO_FLAG_LOCKING_SHIFT
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9416 | CODING_ISO_FLAG_SINGLE_SHIFT))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9417 ? coding_category_iso_7_else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9418 : EQ (args[coding_arg_charset_list], Qiso_2022)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9419 ? coding_category_iso_7
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9420 : coding_category_iso_7_tight);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9421 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9422 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9423 int id = XINT (AREF (initial, 1));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9424
88977
3b05c02eebf2 (Fdefine_coding_system_internal): Fix category setting
Kenichi Handa <handa@m17n.org>
parents: 88950
diff changeset
9425 category = (((i & CODING_ISO_FLAG_LOCKING_SHIFT)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9426 || EQ (args[coding_arg_charset_list], Qiso_2022)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9427 || id < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9428 ? coding_category_iso_8_else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9429 : (CHARSET_DIMENSION (CHARSET_FROM_ID (id)) == 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9430 ? coding_category_iso_8_1
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9431 : coding_category_iso_8_2);
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
9432 }
89227
101ee928c088 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89225
diff changeset
9433 if (category != coding_category_iso_8_1
101ee928c088 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89225
diff changeset
9434 && category != coding_category_iso_8_2)
101ee928c088 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89225
diff changeset
9435 CODING_ATTR_ASCII_COMPAT (attrs) = Qnil;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9436 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9437 else if (EQ (coding_type, Qemacs_mule))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9438 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9439 if (EQ (args[coding_arg_charset_list], Qemacs_mule))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9440 ASET (attrs, coding_attr_emacs_mule_full, Qt);
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9441 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9442 category = coding_category_emacs_mule;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9443 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9444 else if (EQ (coding_type, Qshift_jis))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9445 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9446
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9447 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9448
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
9449 if (XINT (Flength (charset_list)) != 3
89739
293c9235be3f (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89732
diff changeset
9450 && XINT (Flength (charset_list)) != 4)
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
9451 error ("There should be three or four charsets");
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9452
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9453 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9454 if (CHARSET_DIMENSION (charset) != 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9455 error ("Dimension of charset %s is not one",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9456 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9457 if (CHARSET_ASCII_COMPATIBLE_P (charset))
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9458 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9459
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9460 charset_list = XCDR (charset_list);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9461 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9462 if (CHARSET_DIMENSION (charset) != 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9463 error ("Dimension of charset %s is not one",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9464 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9465
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9466 charset_list = XCDR (charset_list);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9467 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9468 if (CHARSET_DIMENSION (charset) != 2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9469 error ("Dimension of charset %s is not two",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9470 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9471
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
9472 charset_list = XCDR (charset_list);
89740
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
9473 if (! NILP (charset_list))
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
9474 {
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
9475 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
9476 if (CHARSET_DIMENSION (charset) != 2)
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
9477 error ("Dimension of charset %s is not two",
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
9478 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
9479 }
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
9480
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9481 category = coding_category_sjis;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9482 Vsjis_coding_system = name;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9483 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9484 else if (EQ (coding_type, Qbig5))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9485 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9486 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9487
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9488 if (XINT (Flength (charset_list)) != 2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9489 error ("There should be just two charsets");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9490
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9491 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9492 if (CHARSET_DIMENSION (charset) != 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9493 error ("Dimension of charset %s is not one",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9494 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9495 if (CHARSET_ASCII_COMPATIBLE_P (charset))
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9496 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9497
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9498 charset_list = XCDR (charset_list);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9499 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9500 if (CHARSET_DIMENSION (charset) != 2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9501 error ("Dimension of charset %s is not two",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9502 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9503
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9504 category = coding_category_big5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9505 Vbig5_coding_system = name;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9506 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9507 else if (EQ (coding_type, Qraw_text))
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9508 {
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9509 category = coding_category_raw_text;
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9510 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9511 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9512 else if (EQ (coding_type, Qutf_8))
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9513 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9514 Lisp_Object bom;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9515
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9516 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9517
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9518 if (nargs < coding_arg_utf8_max)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9519 goto short_args;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9520
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9521 bom = args[coding_arg_utf8_bom];
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9522 if (! NILP (bom) && ! EQ (bom, Qt))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9523 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9524 CHECK_CONS (bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9525 val = XCAR (bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9526 CHECK_CODING_SYSTEM (val);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9527 val = XCDR (bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9528 CHECK_CODING_SYSTEM (val);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9529 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9530 ASET (attrs, coding_attr_utf_bom, bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9531
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9532 category = (CONSP (bom) ? coding_category_utf_8_auto
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9533 : NILP (bom) ? coding_category_utf_8_nosig
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9534 : coding_category_utf_8_sig);
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9535 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9536 else if (EQ (coding_type, Qundecided))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9537 category = coding_category_undecided;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9538 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9539 error ("Invalid coding system type: %s",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9540 SDATA (SYMBOL_NAME (coding_type)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9541
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9542 CODING_ATTR_CATEGORY (attrs) = make_number (category);
89468
7dbbe692f70c * coding.c (QCcategory): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89467
diff changeset
9543 CODING_ATTR_PLIST (attrs)
7dbbe692f70c * coding.c (QCcategory): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89467
diff changeset
9544 = Fcons (QCcategory, Fcons (AREF (Vcoding_category_table, category),
7dbbe692f70c * coding.c (QCcategory): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89467
diff changeset
9545 CODING_ATTR_PLIST (attrs)));
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
9546 CODING_ATTR_PLIST (attrs)
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
9547 = Fcons (QCascii_compatible_p,
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
9548 Fcons (CODING_ATTR_ASCII_COMPAT (attrs),
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
9549 CODING_ATTR_PLIST (attrs)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9550
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9551 eol_type = args[coding_arg_eol_type];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9552 if (! NILP (eol_type)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9553 && ! EQ (eol_type, Qunix)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9554 && ! EQ (eol_type, Qdos)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9555 && ! EQ (eol_type, Qmac))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9556 error ("Invalid eol-type");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9557
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9558 aliases = Fcons (name, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9559
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9560 if (NILP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9561 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9562 eol_type = make_subsidiaries (name);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9563 for (i = 0; i < 3; i++)
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
9564 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9565 Lisp_Object this_spec, this_name, this_aliases, this_eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9566
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9567 this_name = AREF (eol_type, i);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9568 this_aliases = Fcons (this_name, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9569 this_eol_type = (i == 0 ? Qunix : i == 1 ? Qdos : Qmac);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9570 this_spec = Fmake_vector (make_number (3), attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9571 ASET (this_spec, 1, this_aliases);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9572 ASET (this_spec, 2, this_eol_type);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9573 Fputhash (this_name, this_spec, Vcoding_system_hash_table);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9574 Vcoding_system_list = Fcons (this_name, Vcoding_system_list);
90289
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
9575 val = Fassoc (Fsymbol_name (this_name), Vcoding_system_alist);
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
9576 if (NILP (val))
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
9577 Vcoding_system_alist
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
9578 = Fcons (Fcons (Fsymbol_name (this_name), Qnil),
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
9579 Vcoding_system_alist);
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
9580 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9581 }
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
9582
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9583 spec_vec = Fmake_vector (make_number (3), attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9584 ASET (spec_vec, 1, aliases);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9585 ASET (spec_vec, 2, eol_type);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9586
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9587 Fputhash (name, spec_vec, Vcoding_system_hash_table);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9588 Vcoding_system_list = Fcons (name, Vcoding_system_list);
90289
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
9589 val = Fassoc (Fsymbol_name (name), Vcoding_system_alist);
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
9590 if (NILP (val))
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
9591 Vcoding_system_alist = Fcons (Fcons (Fsymbol_name (name), Qnil),
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
9592 Vcoding_system_alist);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9593
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9594 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9595 int id = coding_categories[category].id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9596
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9597 if (id < 0 || EQ (name, CODING_ID_NAME (id)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9598 setup_coding_system (name, &coding_categories[category]);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9599 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9600
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9601 return Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9602
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9603 short_args:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9604 return Fsignal (Qwrong_number_of_arguments,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9605 Fcons (intern ("define-coding-system-internal"),
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9606 make_number (nargs)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9607 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9608
89571
242f2cc0134b (Fdefine_coding_system_alias): Update Vcoding_system_list.
Kenichi Handa <handa@m17n.org>
parents: 89562
diff changeset
9609
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9610 DEFUN ("coding-system-put", Fcoding_system_put, Scoding_system_put,
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9611 3, 3, 0,
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9612 doc: /* Change value in CODING-SYSTEM's property list PROP to VAL. */)
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9613 (coding_system, prop, val)
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9614 Lisp_Object coding_system, prop, val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9615 {
89924
7d0f6da3ea6e (detect_coding): Delete unused variables.
Kenichi Handa <handa@m17n.org>
parents: 89917
diff changeset
9616 Lisp_Object spec, attrs;
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9617
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9618 CHECK_CODING_SYSTEM_GET_SPEC (coding_system, spec);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9619 attrs = AREF (spec, 0);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9620 if (EQ (prop, QCmnemonic))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9621 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9622 if (! STRINGP (val))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9623 CHECK_CHARACTER (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9624 CODING_ATTR_MNEMONIC (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9625 }
100303
3e044fa54e4f * coding.c (QCdefault_char): Rename from QCdefalut_char.
Juanma Barranquero <lekktu@gmail.com>
parents: 100262
diff changeset
9626 else if (EQ (prop, QCdefault_char))
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9627 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9628 if (NILP (val))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9629 val = make_number (' ');
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9630 else
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9631 CHECK_CHARACTER (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9632 CODING_ATTR_DEFAULT_CHAR (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9633 }
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9634 else if (EQ (prop, QCdecode_translation_table))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9635 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9636 if (! CHAR_TABLE_P (val) && ! CONSP (val))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9637 CHECK_SYMBOL (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9638 CODING_ATTR_DECODE_TBL (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9639 }
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9640 else if (EQ (prop, QCencode_translation_table))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9641 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9642 if (! CHAR_TABLE_P (val) && ! CONSP (val))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9643 CHECK_SYMBOL (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9644 CODING_ATTR_ENCODE_TBL (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9645 }
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9646 else if (EQ (prop, QCpost_read_conversion))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9647 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9648 CHECK_SYMBOL (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9649 CODING_ATTR_POST_READ (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9650 }
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9651 else if (EQ (prop, QCpre_write_conversion))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9652 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9653 CHECK_SYMBOL (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9654 CODING_ATTR_PRE_WRITE (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9655 }
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
9656 else if (EQ (prop, QCascii_compatible_p))
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
9657 {
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
9658 CODING_ATTR_ASCII_COMPAT (attrs) = val;
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
9659 }
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9660
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9661 CODING_ATTR_PLIST (attrs)
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9662 = Fplist_put (CODING_ATTR_PLIST (attrs), prop, val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9663 return val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9664 }
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9665
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9666
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9667 DEFUN ("define-coding-system-alias", Fdefine_coding_system_alias,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9668 Sdefine_coding_system_alias, 2, 2, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9669 doc: /* Define ALIAS as an alias for CODING-SYSTEM. */)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9670 (alias, coding_system)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9671 Lisp_Object alias, coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9672 {
90289
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
9673 Lisp_Object spec, aliases, eol_type, val;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9674
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9675 CHECK_SYMBOL (alias);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9676 CHECK_CODING_SYSTEM_GET_SPEC (coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9677 aliases = AREF (spec, 1);
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9678 /* ALIASES should be a list of length more than zero, and the first
89571
242f2cc0134b (Fdefine_coding_system_alias): Update Vcoding_system_list.
Kenichi Handa <handa@m17n.org>
parents: 89562
diff changeset
9679 element is a base coding system. Append ALIAS at the tail of the
242f2cc0134b (Fdefine_coding_system_alias): Update Vcoding_system_list.
Kenichi Handa <handa@m17n.org>
parents: 89562
diff changeset
9680 list. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9681 while (!NILP (XCDR (aliases)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9682 aliases = XCDR (aliases);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9683 XSETCDR (aliases, Fcons (alias, Qnil));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9684
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9685 eol_type = AREF (spec, 2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9686 if (VECTORP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9687 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9688 Lisp_Object subsidiaries;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9689 int i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9690
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9691 subsidiaries = make_subsidiaries (alias);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9692 for (i = 0; i < 3; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9693 Fdefine_coding_system_alias (AREF (subsidiaries, i),
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9694 AREF (eol_type, i));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9695 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9696
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9697 Fputhash (alias, spec, Vcoding_system_hash_table);
89571
242f2cc0134b (Fdefine_coding_system_alias): Update Vcoding_system_list.
Kenichi Handa <handa@m17n.org>
parents: 89562
diff changeset
9698 Vcoding_system_list = Fcons (alias, Vcoding_system_list);
90289
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
9699 val = Fassoc (Fsymbol_name (alias), Vcoding_system_alist);
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
9700 if (NILP (val))
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
9701 Vcoding_system_alist = Fcons (Fcons (Fsymbol_name (alias), Qnil),
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
9702 Vcoding_system_alist);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9703
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9704 return Qnil;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9705 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9706
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9707 DEFUN ("coding-system-base", Fcoding_system_base, Scoding_system_base,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9708 1, 1, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9709 doc: /* Return the base of CODING-SYSTEM.
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
9710 Any alias or subsidiary coding system is not a base coding system. */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9711 (coding_system)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9712 Lisp_Object coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9713 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9714 Lisp_Object spec, attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9715
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9716 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9717 return (Qno_conversion);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9718 CHECK_CODING_SYSTEM_GET_SPEC (coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9719 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9720 return CODING_ATTR_BASE_NAME (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9721 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9722
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9723 DEFUN ("coding-system-plist", Fcoding_system_plist, Scoding_system_plist,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9724 1, 1, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9725 doc: "Return the property list of CODING-SYSTEM.")
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
9726 (coding_system)
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
9727 Lisp_Object coding_system;
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
9728 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9729 Lisp_Object spec, attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9730
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9731 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9732 coding_system = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9733 CHECK_CODING_SYSTEM_GET_SPEC (coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9734 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9735 return CODING_ATTR_PLIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9736 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9737
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9738
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9739 DEFUN ("coding-system-aliases", Fcoding_system_aliases, Scoding_system_aliases,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9740 1, 1, 0,
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
9741 doc: /* Return the list of aliases of CODING-SYSTEM. */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9742 (coding_system)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9743 Lisp_Object coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9744 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9745 Lisp_Object spec;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9746
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9747 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9748 coding_system = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9749 CHECK_CODING_SYSTEM_GET_SPEC (coding_system, spec);
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
9750 return AREF (spec, 1);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9751 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9752
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9753 DEFUN ("coding-system-eol-type", Fcoding_system_eol_type,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9754 Scoding_system_eol_type, 1, 1, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9755 doc: /* Return eol-type of CODING-SYSTEM.
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9756 An eol-type is an integer 0, 1, 2, or a vector of coding systems.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9757
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9758 Integer values 0, 1, and 2 indicate a format of end-of-line; LF, CRLF,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9759 and CR respectively.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9760
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9761 A vector value indicates that a format of end-of-line should be
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9762 detected automatically. Nth element of the vector is the subsidiary
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9763 coding system whose eol-type is N. */)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9764 (coding_system)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9765 Lisp_Object coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9766 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9767 Lisp_Object spec, eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9768 int n;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9769
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9770 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9771 coding_system = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9772 if (! CODING_SYSTEM_P (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9773 return Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9774 spec = CODING_SYSTEM_SPEC (coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9775 eol_type = AREF (spec, 2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9776 if (VECTORP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9777 return Fcopy_sequence (eol_type);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9778 n = EQ (eol_type, Qunix) ? 0 : EQ (eol_type, Qdos) ? 1 : 2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9779 return make_number (n);
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
9780 }
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
9781
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9782 #endif /* emacs */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9783
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9784
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
9785 /*** 9. Post-amble ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9786
21514
fa9ff387d260 Fix -Wimplicit warnings.
Andreas Schwab <schwab@suse.de>
parents: 21505
diff changeset
/* init_coding_once: fill in the static tables used by this file.
   Takes no arguments and returns nothing.  It
     - gives every coding category the id -1 and sets the priority
       order to the identity mapping,
     - classifies each of the 256 byte values in iso_code_class,
     - sets every emacs_mule_bytes entry to 1, then 3 or 4 for the
       four private leading codes.
   NOTE(review): the name suggests this is meant to run exactly once
   at startup -- confirm against the caller.  */
9787 void
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9788 init_coding_once ()
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9789 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9790 int i;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9791
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Reset every category's id to -1 (presumably "no coding system
   assigned yet" -- confirm) and make priority slot I hold category I.  */
9792 for (i = 0; i < coding_category_max; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9793 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9794 coding_categories[i].id = -1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9795 coding_priorities[i] = i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9796 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9797
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9798 /* ISO2022 specific initialize routine. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
/* Bytes 0x00..0x1F get the generic ISO_control_0 class.  */
9799 for (i = 0; i < 0x20; i++)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
9800 iso_code_class[i] = ISO_control_0;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
/* Bytes 0x21..0x7E; 0x20 and 0x7F are deliberately left out of this
   range and get their own class further down.  */
9801 for (i = 0x21; i < 0x7F; i++)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9802 iso_code_class[i] = ISO_graphic_plane_0;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
/* Bytes 0x80..0x9F get the generic ISO_control_1 class.  */
9803 for (i = 0x80; i < 0xA0; i++)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
9804 iso_code_class[i] = ISO_control_1;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
/* Bytes 0xA1..0xFE; 0xA0 and 0xFF are handled separately below.  */
9805 for (i = 0xA1; i < 0xFF; i++)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9806 iso_code_class[i] = ISO_graphic_plane_1;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
/* The four boundary bytes skipped by the loops above.  */
9807 iso_code_class[0x20] = iso_code_class[0x7F] = ISO_0x20_or_0x7F;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9808 iso_code_class[0xA0] = iso_code_class[0xFF] = ISO_0xA0_or_0xFF;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
/* Give specific codes their own class.  These run after the loops, so
   they win over any generic class already stored for the same byte
   (presumably all of them fall in the control ranges -- the ISO_CODE_*
   values are defined elsewhere; confirm).  */
9809 iso_code_class[ISO_CODE_SO] = ISO_shift_out;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9810 iso_code_class[ISO_CODE_SI] = ISO_shift_in;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9811 iso_code_class[ISO_CODE_SS2_7] = ISO_single_shift_2_7;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9812 iso_code_class[ISO_CODE_ESC] = ISO_escape;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9813 iso_code_class[ISO_CODE_SS2] = ISO_single_shift_2;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9814 iso_code_class[ISO_CODE_SS3] = ISO_single_shift_3;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9815 iso_code_class[ISO_CODE_CSI] = ISO_control_sequence_introducer;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9816
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
/* Default every emacs_mule_bytes entry to 1; only the four private
   leading codes below are raised to 3 or 4.  (Presumably the value is
   the byte length of a sequence starting with that byte -- confirm.)  */
9817 for (i = 0; i < 256; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9818 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9819 emacs_mule_bytes[i] = 1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9820 }
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
9821 emacs_mule_bytes[EMACS_MULE_LEADING_CODE_PRIVATE_11] = 3;
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
9822 emacs_mule_bytes[EMACS_MULE_LEADING_CODE_PRIVATE_12] = 3;
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
9823 emacs_mule_bytes[EMACS_MULE_LEADING_CODE_PRIVATE_21] = 4;
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
9824 emacs_mule_bytes[EMACS_MULE_LEADING_CODE_PRIVATE_22] = 4;
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9825 }
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9826
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9827 #ifdef emacs
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9828
21514
fa9ff387d260 Fix -Wimplicit warnings.
Andreas Schwab <schwab@suse.de>
parents: 21505
diff changeset
9829 void
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9830 syms_of_coding ()
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9831 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9832 staticpro (&Vcoding_system_hash_table);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9833 {
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9834 Lisp_Object args[2];
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9835 args[0] = QCtest;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9836 args[1] = Qeq;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9837 Vcoding_system_hash_table = Fmake_hash_table (2, args);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9838 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9839
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9840 staticpro (&Vsjis_coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9841 Vsjis_coding_system = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9842
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9843 staticpro (&Vbig5_coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9844 Vbig5_coding_system = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9845
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
9846 staticpro (&Vcode_conversion_reused_workbuf);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
9847 Vcode_conversion_reused_workbuf = Qnil;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
9848
58637
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
9849 staticpro (&Vcode_conversion_workbuf_name);
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
9850 Vcode_conversion_workbuf_name = build_string (" *code-conversion-work*");
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
9851
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
9852 reused_workbuf_in_use = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9853
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9854 DEFSYM (Qcharset, "charset");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9855 DEFSYM (Qtarget_idx, "target-idx");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9856 DEFSYM (Qcoding_system_history, "coding-system-history");
19750
95e4e1cba6ac (Qcoding_system_history): New variable.
Richard M. Stallman <rms@gnu.org>
parents: 19747
diff changeset
9857 Fset (Qcoding_system_history, Qnil);
95e4e1cba6ac (Qcoding_system_history): New variable.
Richard M. Stallman <rms@gnu.org>
parents: 19747
diff changeset
9858
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
9859 /* Target FILENAME is the first argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9860 Fput (Qinsert_file_contents, Qtarget_idx, make_number (0));
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
9861 /* Target FILENAME is the third argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9862 Fput (Qwrite_region, Qtarget_idx, make_number (2));
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9863
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9864 DEFSYM (Qcall_process, "call-process");
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
9865 /* Target PROGRAM is the first argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9866 Fput (Qcall_process, Qtarget_idx, make_number (0));
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9867
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9868 DEFSYM (Qcall_process_region, "call-process-region");
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
9869 /* Target PROGRAM is the third argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9870 Fput (Qcall_process_region, Qtarget_idx, make_number (2));
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9871
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9872 DEFSYM (Qstart_process, "start-process");
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
9873 /* Target PROGRAM is the third argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9874 Fput (Qstart_process, Qtarget_idx, make_number (2));
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9875
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9876 DEFSYM (Qopen_network_stream, "open-network-stream");
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
9877 /* Target SERVICE is the fourth argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9878 Fput (Qopen_network_stream, Qtarget_idx, make_number (3));
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
9879
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9880 DEFSYM (Qcoding_system, "coding-system");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9881 DEFSYM (Qcoding_aliases, "coding-aliases");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9882
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9883 DEFSYM (Qeol_type, "eol-type");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9884 DEFSYM (Qunix, "unix");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9885 DEFSYM (Qdos, "dos");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9886
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9887 DEFSYM (Qbuffer_file_coding_system, "buffer-file-coding-system");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9888 DEFSYM (Qpost_read_conversion, "post-read-conversion");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9889 DEFSYM (Qpre_write_conversion, "pre-write-conversion");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9890 DEFSYM (Qdefault_char, "default-char");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9891 DEFSYM (Qundecided, "undecided");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9892 DEFSYM (Qno_conversion, "no-conversion");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9893 DEFSYM (Qraw_text, "raw-text");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9894
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9895 DEFSYM (Qiso_2022, "iso-2022");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9896
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9897 DEFSYM (Qutf_8, "utf-8");
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9898 DEFSYM (Qutf_8_emacs, "utf-8-emacs");
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9899
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9900 DEFSYM (Qutf_16, "utf-16");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9901 DEFSYM (Qbig, "big");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9902 DEFSYM (Qlittle, "little");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9903
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9904 DEFSYM (Qshift_jis, "shift-jis");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9905 DEFSYM (Qbig5, "big5");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9906
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9907 DEFSYM (Qcoding_system_p, "coding-system-p");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9908
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9909 DEFSYM (Qcoding_system_error, "coding-system-error");
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9910 Fput (Qcoding_system_error, Qerror_conditions,
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9911 Fcons (Qcoding_system_error, Fcons (Qerror, Qnil)));
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9912 Fput (Qcoding_system_error, Qerror_message,
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
9913 build_string ("Invalid coding system"));
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9914
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
9915 /* Intern this now in case it isn't already done.
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
9916 Setting this variable twice is harmless.
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
9917 But don't staticpro it here--that is done in alloc.c. */
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
9918 Qchar_table_extra_slots = intern ("char-table-extra-slots");
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9919
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9920 DEFSYM (Qtranslation_table, "translation-table");
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
9921 Fput (Qtranslation_table, Qchar_table_extra_slots, make_number (2));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9922 DEFSYM (Qtranslation_table_id, "translation-table-id");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9923 DEFSYM (Qtranslation_table_for_decode, "translation-table-for-decode");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9924 DEFSYM (Qtranslation_table_for_encode, "translation-table-for-encode");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9925
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9926 DEFSYM (Qvalid_codes, "valid-codes");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9927
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9928 DEFSYM (Qemacs_mule, "emacs-mule");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9929
89468
7dbbe692f70c * coding.c (QCcategory): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89467
diff changeset
9930 DEFSYM (QCcategory, ":category");
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9931 DEFSYM (QCmnemonic, ":mnemonic");
100303
3e044fa54e4f * coding.c (QCdefault_char): Rename from QCdefalut_char.
Juanma Barranquero <lekktu@gmail.com>
parents: 100262
diff changeset
9932 DEFSYM (QCdefault_char, ":default-char");
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9933 DEFSYM (QCdecode_translation_table, ":decode-translation-table");
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9934 DEFSYM (QCencode_translation_table, ":encode-translation-table");
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9935 DEFSYM (QCpost_read_conversion, ":post-read-conversion");
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9936 DEFSYM (QCpre_write_conversion, ":pre-write-conversion");
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
9937 DEFSYM (QCascii_compatible_p, ":ascii-compatible-p");
89468
7dbbe692f70c * coding.c (QCcategory): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89467
diff changeset
9938
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9939 Vcoding_category_table
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9940 = Fmake_vector (make_number (coding_category_max), Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9941 staticpro (&Vcoding_category_table);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9942 /* The following are targets of code detection. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9943 ASET (Vcoding_category_table, coding_category_iso_7,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9944 intern ("coding-category-iso-7"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9945 ASET (Vcoding_category_table, coding_category_iso_7_tight,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9946 intern ("coding-category-iso-7-tight"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9947 ASET (Vcoding_category_table, coding_category_iso_8_1,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9948 intern ("coding-category-iso-8-1"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9949 ASET (Vcoding_category_table, coding_category_iso_8_2,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9950 intern ("coding-category-iso-8-2"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9951 ASET (Vcoding_category_table, coding_category_iso_7_else,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9952 intern ("coding-category-iso-7-else"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9953 ASET (Vcoding_category_table, coding_category_iso_8_else,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9954 intern ("coding-category-iso-8-else"));
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9955 ASET (Vcoding_category_table, coding_category_utf_8_auto,
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9956 intern ("coding-category-utf-8-auto"));
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9957 ASET (Vcoding_category_table, coding_category_utf_8_nosig,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9958 intern ("coding-category-utf-8"));
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9959 ASET (Vcoding_category_table, coding_category_utf_8_sig,
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9960 intern ("coding-category-utf-8-sig"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9961 ASET (Vcoding_category_table, coding_category_utf_16_be,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9962 intern ("coding-category-utf-16-be"));
89467
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9963 ASET (Vcoding_category_table, coding_category_utf_16_auto,
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9964 intern ("coding-category-utf-16-auto"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9965 ASET (Vcoding_category_table, coding_category_utf_16_le,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9966 intern ("coding-category-utf-16-le"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9967 ASET (Vcoding_category_table, coding_category_utf_16_be_nosig,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9968 intern ("coding-category-utf-16-be-nosig"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9969 ASET (Vcoding_category_table, coding_category_utf_16_le_nosig,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9970 intern ("coding-category-utf-16-le-nosig"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9971 ASET (Vcoding_category_table, coding_category_charset,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9972 intern ("coding-category-charset"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9973 ASET (Vcoding_category_table, coding_category_sjis,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9974 intern ("coding-category-sjis"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9975 ASET (Vcoding_category_table, coding_category_big5,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9976 intern ("coding-category-big5"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9977 ASET (Vcoding_category_table, coding_category_ccl,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9978 intern ("coding-category-ccl"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9979 ASET (Vcoding_category_table, coding_category_emacs_mule,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9980 intern ("coding-category-emacs-mule"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9981 /* The following are NOT targets of code detection. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9982 ASET (Vcoding_category_table, coding_category_raw_text,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9983 intern ("coding-category-raw-text"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9984 ASET (Vcoding_category_table, coding_category_undecided,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9985 intern ("coding-category-undecided"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9986
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
9987 DEFSYM (Qinsufficient_source, "insufficient-source");
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
9988 DEFSYM (Qinconsistent_eol, "inconsistent-eol");
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
9989 DEFSYM (Qinvalid_source, "invalid-source");
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
9990 DEFSYM (Qinterrupted, "interrupted");
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
9991 DEFSYM (Qinsufficient_memory, "insufficient-memory");
90272
f1df126ec7de Sync to HEAD for handling autoload-coding-system.
Kenichi Handa <handa@m17n.org>
parents: 90263
diff changeset
9992 DEFSYM (Qcoding_system_define_form, "coding-system-define-form");
52794
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
9993
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9994 defsubr (&Scoding_system_p);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9995 defsubr (&Sread_coding_system);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9996 defsubr (&Sread_non_nil_coding_system);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9997 defsubr (&Scheck_coding_system);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9998 defsubr (&Sdetect_coding_region);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9999 defsubr (&Sdetect_coding_string);
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
10000 defsubr (&Sfind_coding_systems_region_internal);
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
10001 defsubr (&Sunencodable_char_position);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10002 defsubr (&Scheck_coding_systems_region);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10003 defsubr (&Sdecode_coding_region);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10004 defsubr (&Sencode_coding_region);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10005 defsubr (&Sdecode_coding_string);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10006 defsubr (&Sencode_coding_string);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10007 defsubr (&Sdecode_sjis_char);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10008 defsubr (&Sencode_sjis_char);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10009 defsubr (&Sdecode_big5_char);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10010 defsubr (&Sencode_big5_char);
18002
a14261786239 (encode_invocation_designation): Use macro
Kenichi Handa <handa@m17n.org>
parents: 17835
diff changeset
10011 defsubr (&Sset_terminal_coding_system_internal);
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
10012 defsubr (&Sset_safe_terminal_coding_system_internal);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10013 defsubr (&Sterminal_coding_system);
18002
a14261786239 (encode_invocation_designation): Use macro
Kenichi Handa <handa@m17n.org>
parents: 17835
diff changeset
10014 defsubr (&Sset_keyboard_coding_system_internal);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10015 defsubr (&Skeyboard_coding_system);
18536
69c0e220b626 (Vstandard_character_unification_table_for_decode):
Kenichi Handa <handa@m17n.org>
parents: 18523
diff changeset
10016 defsubr (&Sfind_operation_coding_system);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10017 defsubr (&Sset_coding_system_priority);
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10018 defsubr (&Sdefine_coding_system_internal);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10019 defsubr (&Sdefine_coding_system_alias);
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10020 defsubr (&Scoding_system_put);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10021 defsubr (&Scoding_system_base);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10022 defsubr (&Scoding_system_plist);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10023 defsubr (&Scoding_system_aliases);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10024 defsubr (&Scoding_system_eol_type);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10025 defsubr (&Scoding_system_priority_list);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10026
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10027 DEFVAR_LISP ("coding-system-list", &Vcoding_system_list,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10028 doc: /* List of coding systems.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10029
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10030 Do not alter the value of this variable manually. This variable should be
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10031 updated by the functions `define-coding-system' and
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10032 `define-coding-system-alias'. */);
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10033 Vcoding_system_list = Qnil;
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10034
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10035 DEFVAR_LISP ("coding-system-alist", &Vcoding_system_alist,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10036 doc: /* Alist of coding system names.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10037 Each element is a one-element list containing a coding system name.
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10038 This variable is given to `completing-read' as COLLECTION argument.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10039
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10040 Do not alter the value of this variable manually. This variable should be
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10041 updated by the functions `define-coding-system' and
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10042 `define-coding-system-alias'. */);
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10043 Vcoding_system_alist = Qnil;
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10044
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10045 DEFVAR_LISP ("coding-category-list", &Vcoding_category_list,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10046 doc: /* List of coding-categories (symbols) ordered by priority.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10047
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10048 On detecting a coding system, Emacs tries code detection algorithms
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10049 associated with each coding-category one by one in this order. When
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10050 one algorithm agrees with a byte sequence of source text, the coding
60608
4b80e9c28e8f (syms_of_coding): Docstring of coding-category-list fixed.
Kenichi Handa <handa@m17n.org>
parents: 60031
diff changeset
10051 system bound to the corresponding coding-category is selected.
4b80e9c28e8f (syms_of_coding): Docstring of coding-category-list fixed.
Kenichi Handa <handa@m17n.org>
parents: 60031
diff changeset
10052
61166
e3a6dd630fdf (Vcoding_category_list): Docstring fix.
Kenichi Handa <handa@m17n.org>
parents: 60907
diff changeset
10053 Don't modify this variable directly, but use `set-coding-system-priority'. */);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10054 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10055 int i;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10056
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10057 Vcoding_category_list = Qnil;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10058 for (i = coding_category_max - 1; i >= 0; i--)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10059 Vcoding_category_list
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10060 = Fcons (XVECTOR (Vcoding_category_table)->contents[i],
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10061 Vcoding_category_list);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10062 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10063
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10064 DEFVAR_LISP ("coding-system-for-read", &Vcoding_system_for_read,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10065 doc: /* Specify the coding system for read operations.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10066 It is useful to bind this variable with `let', but do not set it globally.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10067 If the value is a coding system, it is used for decoding on read operation.
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10068 If not, an appropriate element is used from one of the coding system alists.
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10069 There are three such tables: `file-coding-system-alist',
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10070 `process-coding-system-alist', and `network-coding-system-alist'. */);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10071 Vcoding_system_for_read = Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10072
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10073 DEFVAR_LISP ("coding-system-for-write", &Vcoding_system_for_write,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10074 doc: /* Specify the coding system for write operations.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10075 Programs bind this variable with `let', but you should not set it globally.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10076 If the value is a coding system, it is used for encoding of output,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10077 when writing it to a file and when sending it to a file or subprocess.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10078
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10079 If this does not specify a coding system, an appropriate element
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10080 is used from one of the coding system alists.
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10081 There are three such tables: `file-coding-system-alist',
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10082 `process-coding-system-alist', and `network-coding-system-alist'.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10083 For output to files, if the above procedure does not specify a coding system,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10084 the value of `buffer-file-coding-system' is used. */);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10085 Vcoding_system_for_write = Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10086
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10087 DEFVAR_LISP ("last-coding-system-used", &Vlast_coding_system_used,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10088 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10089 Coding system used in the latest file or process I/O. */);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10090 Vlast_coding_system_used = Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10091
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10092 DEFVAR_LISP ("last-code-conversion-error", &Vlast_code_conversion_error,
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10093 doc: /*
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10094 Error status of the last code conversion.
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10095
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10096 When an error was detected in the last code conversion, this variable
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10097 is set to one of the following symbols.
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10098 `insufficient-source'
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10099 `inconsistent-eol'
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10100 `invalid-source'
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10101 `interrupted'
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10102 `insufficient-memory'
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10103 When no error was detected, the value doesn't change. So, to check
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10104 the error status of a code conversion by this variable, you must
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10105 explicitly set this variable to nil before performing code
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10106 conversion. */);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10107 Vlast_code_conversion_error = Qnil;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10108
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10109 DEFVAR_BOOL ("inhibit-eol-conversion", &inhibit_eol_conversion,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10110 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10111 *Non-nil means always inhibit code conversion of end-of-line format.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10112 See info node `Coding Systems' and info node `Text and Binary' concerning
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10113 such conversion. */);
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10114 inhibit_eol_conversion = 0;
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10115
21574
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
10116 DEFVAR_BOOL ("inherit-process-coding-system", &inherit_process_coding_system,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10117 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10118 Non-nil means process buffer inherits coding system of process output.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10119 Bind it to t if the process output is to be treated as if it were a file
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10120 read from some filesystem. */);
21574
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
10121 inherit_process_coding_system = 0;
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
10122
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10123 DEFVAR_LISP ("file-coding-system-alist", &Vfile_coding_system_alist,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10124 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10125 Alist to decide a coding system to use for a file I/O operation.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10126 The format is ((PATTERN . VAL) ...),
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10127 where PATTERN is a regular expression matching a file name,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10128 VAL is a coding system, a cons of coding systems, or a function symbol.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10129 If VAL is a coding system, it is used for both decoding and encoding
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10130 the file contents.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10131 If VAL is a cons of coding systems, the car part is used for decoding,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10132 and the cdr part is used for encoding.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10133 If VAL is a function symbol, the function must return a coding system
72323
af796bc81ff0 (syms_of_coding): Improve the docstring
Kenichi Handa <handa@m17n.org>
parents: 72188
diff changeset
10134 or a cons of coding systems which are used as above. The function is
af796bc81ff0 (syms_of_coding): Improve the docstring
Kenichi Handa <handa@m17n.org>
parents: 72188
diff changeset
10135 called with an argument that is a list of the arguments with which
81611
ae42ad5f89e6 (Ffind_operation_coding_system): Docstring improved.
Kenichi Handa <handa@m17n.org>
parents: 75348
diff changeset
10136 `find-operation-coding-system' was called. If the function can't decide
ae42ad5f89e6 (Ffind_operation_coding_system): Docstring improved.
Kenichi Handa <handa@m17n.org>
parents: 75348
diff changeset
10137 a coding system, it can return `undecided' so that the normal
ae42ad5f89e6 (Ffind_operation_coding_system): Docstring improved.
Kenichi Handa <handa@m17n.org>
parents: 75348
diff changeset
10138 code-detection is performed.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10139
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10140 See also the function `find-operation-coding-system'
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10141 and the variable `auto-coding-alist'. */);
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10142 Vfile_coding_system_alist = Qnil;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10143
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10144 DEFVAR_LISP ("process-coding-system-alist", &Vprocess_coding_system_alist,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10145 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10146 Alist to decide a coding system to use for a process I/O operation.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10147 The format is ((PATTERN . VAL) ...),
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10148 where PATTERN is a regular expression matching a program name,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10149 VAL is a coding system, a cons of coding systems, or a function symbol.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10150 If VAL is a coding system, it is used for both decoding what is received
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10151 from the program and encoding what is sent to the program.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10152 If VAL is a cons of coding systems, the car part is used for decoding,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10153 and the cdr part is used for encoding.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10154 If VAL is a function symbol, the function must return a coding system
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10155 or a cons of coding systems which are used as above.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10156
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10157 See also the function `find-operation-coding-system'. */);
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10158 Vprocess_coding_system_alist = Qnil;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10159
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10160 DEFVAR_LISP ("network-coding-system-alist", &Vnetwork_coding_system_alist,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10161 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10162 Alist to decide a coding system to use for a network I/O operation.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10163 The format is ((PATTERN . VAL) ...),
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10164 where PATTERN is a regular expression matching a network service name
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10165 or is a port number to connect to,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10166 VAL is a coding system, a cons of coding systems, or a function symbol.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10167 If VAL is a coding system, it is used for both decoding what is received
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10168 from the network stream and encoding what is sent to the network stream.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10169 If VAL is a cons of coding systems, the car part is used for decoding,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10170 and the cdr part is used for encoding.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10171 If VAL is a function symbol, the function must return a coding system
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10172 or a cons of coding systems which are used as above.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10173
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10174 See also the function `find-operation-coding-system'. */);
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10175 Vnetwork_coding_system_alist = Qnil;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10176
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10177 DEFVAR_LISP ("locale-coding-system", &Vlocale_coding_system,
41026
6f20449b7e12 (syms_of_coding): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents: 41006
diff changeset
10178 doc: /* Coding system to use with system messages.
6f20449b7e12 (syms_of_coding): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents: 41006
diff changeset
10179 Also used for decoding keyboard input on X Window system. */);
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10180 Vlocale_coding_system = Qnil;
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10181
29182
1d1c27067af4 (encode_eol): Add null statement after label.
Dave Love <fx@gnu.org>
parents: 29172
diff changeset
10182 /* The eol mnemonics are reset in startup.el system-dependently. */
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10183 DEFVAR_LISP ("eol-mnemonic-unix", &eol_mnemonic_unix,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10184 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10185 *String displayed in mode line for UNIX-like (LF) end-of-line format. */);
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10186 eol_mnemonic_unix = build_string (":");
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10187
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10188 DEFVAR_LISP ("eol-mnemonic-dos", &eol_mnemonic_dos,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10189 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10190 *String displayed in mode line for DOS-like (CRLF) end-of-line format. */);
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10191 eol_mnemonic_dos = build_string ("\\");
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10192
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10193 DEFVAR_LISP ("eol-mnemonic-mac", &eol_mnemonic_mac,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10194 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10195 *String displayed in mode line for MAC-like (CR) end-of-line format. */);
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10196 eol_mnemonic_mac = build_string ("/");
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10197
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10198 DEFVAR_LISP ("eol-mnemonic-undecided", &eol_mnemonic_undecided,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10199 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10200 *String displayed in mode line when end-of-line format is not yet determined. */);
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10201 eol_mnemonic_undecided = build_string (":");
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10202
22119
592bb8b9bcfd Change terms unify/unification to
Kenichi Handa <handa@m17n.org>
parents: 22020
diff changeset
10203 DEFVAR_LISP ("enable-character-translation", &Venable_character_translation,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10204 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10205 *Non-nil enables character translation while encoding and decoding. */);
22119
592bb8b9bcfd Change terms unify/unification to
Kenichi Handa <handa@m17n.org>
parents: 22020
diff changeset
10206 Venable_character_translation = Qt;
592bb8b9bcfd Change terms unify/unification to
Kenichi Handa <handa@m17n.org>
parents: 22020
diff changeset
10207
22186
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
10208 DEFVAR_LISP ("standard-translation-table-for-decode",
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10209 &Vstandard_translation_table_for_decode,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10210 doc: /* Table for translating characters while decoding. */);
22186
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
10211 Vstandard_translation_table_for_decode = Qnil;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
10212
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
10213 DEFVAR_LISP ("standard-translation-table-for-encode",
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10214 &Vstandard_translation_table_for_encode,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10215 doc: /* Table for translating characters while encoding. */);
22186
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
10216 Vstandard_translation_table_for_encode = Qnil;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10217
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10218 DEFVAR_LISP ("charset-revision-table", &Vcharset_revision_table,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10219 doc: /* Alist of charsets vs revision numbers.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10220 While encoding, if a charset (car part of an element) is found,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10221 designate it with the escape sequence identifying revision (cdr part
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10222 of the element). */);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10223 Vcharset_revision_table = Qnil;
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10224
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10225 DEFVAR_LISP ("default-process-coding-system",
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10226 &Vdefault_process_coding_system,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10227 doc: /* Cons of coding systems used for process I/O by default.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10228 The car part is used for decoding a process output,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10229 the cdr part is used for encoding a text to be sent to a process. */);
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10230 Vdefault_process_coding_system = Qnil;
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
10231
19365
d9374f5ebd3a (CODING_FLAG_ISO_LATIN_EXTRA): New macro.
Kenichi Handa <handa@m17n.org>
parents: 19285
diff changeset
10232 DEFVAR_LISP ("latin-extra-code-table", &Vlatin_extra_code_table,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10233 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10234 Table of extra Latin codes in the range 128..159 (inclusive).
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10235 This is a vector of length 256.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10236 If Nth element is non-nil, the existence of code N in a file
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10237 \(or output of subprocess) doesn't prevent it from being detected as
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10238 a coding system of ISO 2022 variant which has a flag
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10239 `accept-latin-extra-code' t (e.g. iso-latin-1) on reading a file
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10240 or reading output of a subprocess.
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10241 Only 128th through 159th elements have a meaning. */);
19365
d9374f5ebd3a (CODING_FLAG_ISO_LATIN_EXTRA): New macro.
Kenichi Handa <handa@m17n.org>
parents: 19285
diff changeset
10242 Vlatin_extra_code_table = Fmake_vector (make_number (256), Qnil);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10243
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10244 DEFVAR_LISP ("select-safe-coding-system-function",
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10245 &Vselect_safe_coding_system_function,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10246 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10247 Function to call to select safe coding system for encoding a text.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10248
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10249 If set, this function is called to force a user to select a proper
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10250 coding system which can encode the text in the case that a default
87778
0ec6f8d26078 (select-safe-coding-system-function): Doc fix.
Glenn Morris <rgm@gnu.org>
parents: 87710
diff changeset
10251 coding system used in each operation can't encode the text. The
0ec6f8d26078 (select-safe-coding-system-function): Doc fix.
Glenn Morris <rgm@gnu.org>
parents: 87710
diff changeset
10252 function should take care that the buffer is not modified while
0ec6f8d26078 (select-safe-coding-system-function): Doc fix.
Glenn Morris <rgm@gnu.org>
parents: 87710
diff changeset
10253 the coding system is being selected.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10254
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10255 The default value is `select-safe-coding-system' (which see). */);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10256 Vselect_safe_coding_system_function = Qnil;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10257
48874
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10258 DEFVAR_BOOL ("coding-system-require-warning",
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10259 &coding_system_require_warning,
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10260 doc: /* Internal use only.
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10261 If non-nil, on writing a file, `select-safe-coding-system-function' is
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10262 called even if `coding-system-for-write' is non-nil. The command
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10263 `universal-coding-system-argument' binds this variable to t temporarily. */);
48874
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10264 coding_system_require_warning = 0;
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10265
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10266
30292
14a9937df1f5 (syms_of_coding): Fix typo in spelling of variable
Gerd Moellmann <gerd@gnu.org>
parents: 30263
diff changeset
10267 DEFVAR_BOOL ("inhibit-iso-escape-detection",
30204
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
10268 &inhibit_iso_escape_detection,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10269 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10270 If non-nil, Emacs ignores ISO2022's escape sequence on code detection.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10271
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10272 By default, on reading a file, Emacs tries to detect how the text is
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10273 encoded. This code detection is sensitive to escape sequences. If
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10274 the sequence is valid as ISO2022, the code is determined as one of
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10275 the ISO2022 encodings, and the file is decoded by the corresponding
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10276 coding system (e.g. `iso-2022-7bit').
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10277
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10278 However, there may be cases where you want to read escape sequences in
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10279 a file as is. In such a case, you can set this variable to non-nil.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10280 Then, as the code detection ignores any escape sequences, no file is
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10281 detected as encoded in some ISO2022 encoding. The result is that all
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10282 escape sequences become visible in a buffer.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10283
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10284 The default value is nil, and it is strongly recommended not to change
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10285 it. That is because many Emacs Lisp source files that contain
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10286 non-ASCII characters are encoded by the coding system `iso-2022-7bit'
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10287 in Emacs's distribution, and they won't be decoded correctly on
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10288 reading if you suppress escape sequence detection.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10289
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10290 The other way to read escape sequences in a file without decoding is
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10291 to explicitly specify some coding system that doesn't use ISO2022's
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10292 escape sequence (e.g. `latin-1') on reading by \\[universal-coding-system-argument]. */);
30204
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
10293 inhibit_iso_escape_detection = 0;
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
10294
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
10295 DEFVAR_LISP ("translation-table-for-input", &Vtranslation_table_for_input,
48230
c2ce8280fb97 (Vtranslation_table_for_input): New.
Dave Love <fx@gnu.org>
parents: 48182
diff changeset
10296 doc: /* Char table for translating self-inserting characters.
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10297 This is applied to the result of input methods, not their input.
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10298 See also `keyboard-translate-table'. */);
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
10299 Vtranslation_table_for_input = Qnil;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10300
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10301 {
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10302 Lisp_Object args[coding_arg_max];
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10303 Lisp_Object plist[16];
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10304 int i;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10305
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10306 for (i = 0; i < coding_arg_max; i++)
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10307 args[i] = Qnil;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10308
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10309 plist[0] = intern (":name");
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10310 plist[1] = args[coding_arg_name] = Qno_conversion;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10311 plist[2] = intern (":mnemonic");
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10312 plist[3] = args[coding_arg_mnemonic] = make_number ('=');
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10313 plist[4] = intern (":coding-type");
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10314 plist[5] = args[coding_arg_coding_type] = Qraw_text;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10315 plist[6] = intern (":ascii-compatible-p");
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10316 plist[7] = args[coding_arg_ascii_compatible_p] = Qt;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10317 plist[8] = intern (":default-char");
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10318 plist[9] = args[coding_arg_default_char] = make_number (0);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10319 plist[10] = intern (":for-unibyte");
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10320 plist[11] = args[coding_arg_for_unibyte] = Qt;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10321 plist[12] = intern (":docstring");
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10322 plist[13] = build_string ("Do no conversion.\n\
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10323 \n\
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10324 When you visit a file with this coding, the file is read into a\n\
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10325 unibyte buffer as is, thus each byte of a file is treated as a\n\
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10326 character.");
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10327 plist[14] = intern (":eol-type");
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10328 plist[15] = args[coding_arg_eol_type] = Qunix;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10329 args[coding_arg_plist] = Flist (16, plist);
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10330 Fdefine_coding_system_internal (coding_arg_max, args);
90011
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10331
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10332 plist[1] = args[coding_arg_name] = Qundecided;
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10333 plist[3] = args[coding_arg_mnemonic] = make_number ('-');
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10334 plist[5] = args[coding_arg_coding_type] = Qundecided;
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10335 /* This is already set.
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10336 plist[7] = args[coding_arg_ascii_compatible_p] = Qt; */
90011
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10337 plist[8] = intern (":charset-list");
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10338 plist[9] = args[coding_arg_charset_list] = Fcons (Qascii, Qnil);
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10339 plist[11] = args[coding_arg_for_unibyte] = Qnil;
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10340 plist[13] = build_string ("No conversion on encoding, automatic conversion on decoding.");
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10341 plist[15] = args[coding_arg_eol_type] = Qnil;
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10342 args[coding_arg_plist] = Flist (16, plist);
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10343 Fdefine_coding_system_internal (coding_arg_max, args);
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10344 }
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10345
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10346 setup_coding_system (Qno_conversion, &safe_terminal_coding);
89467
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10347
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10348 {
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10349 int i;
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10350
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10351 for (i = 0; i < coding_category_max; i++)
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10352 Fset (AREF (Vcoding_category_table, i), Qno_conversion);
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10353 }
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10354 #if defined (MSDOS) || defined (WINDOWSNT)
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10355 system_eol_type = Qdos;
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10356 #else
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10357 system_eol_type = Qunix;
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10358 #endif
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10359 staticpro (&system_eol_type);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10360 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10361
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10362 char *
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10363 emacs_strerror (error_number)
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10364 int error_number;
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10365 {
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10366 char *str;
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10367
26526
b7438760079b * callproc.c (strerror): Remove decl.
Paul Eggert <eggert@twinsun.com>
parents: 26240
diff changeset
10368 synchronize_system_messages_locale ();
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10369 str = strerror (error_number);
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10370
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10371 if (! NILP (Vlocale_coding_system))
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10372 {
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10373 Lisp_Object dec = code_convert_string_norecord (build_string (str),
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10374 Vlocale_coding_system,
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10375 0);
46370
40db0673e6f0 Most uses of XSTRING combined with STRING_BYTES or indirection changed to
Ken Raeburn <raeburn@raeburn.org>
parents: 46293
diff changeset
10376 str = (char *) SDATA (dec);
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10377 }
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10378
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10379 return str;
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10380 }
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10381
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10382 #endif /* emacs */
29184
446621f88d68 Fix junk from last checkin.
Dave Love <fx@gnu.org>
parents: 29182
diff changeset
10383
52401
695cf19ef79e Add arch taglines
Miles Bader <miles@gnu.org>
parents: 52354
diff changeset
10384 /* arch-tag: 3a3a2b01-5ff6-4071-9afe-f5b808d9229d
695cf19ef79e Add arch taglines
Miles Bader <miles@gnu.org>
parents: 52354
diff changeset
10385 (do not change this comment) */