annotate src/coding.c @ 103104:2380af35be5c

(init_atimer): Also clear stopped_atimers.
author YAMAMOTO Mitsuharu <mituharu@math.s.chiba-u.ac.jp>
date Wed, 29 Apr 2009 03:48:38 +0000
parents e68707cf48a5
children 2f7395806731
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
88936
c6ed294ee664 Comment fix
Dave Love <fx@gnu.org>
parents: 88889
diff changeset
1 /* Coding system handler (conversion, detection, etc).
68651
3bd95f4f2941 Update years in copyright notice; nfc.
Thien-Thi Nguyen <ttn@gnuvola.org>
parents: 68567
diff changeset
2 Copyright (C) 2001, 2002, 2003, 2004, 2005,
100951
e038c1a8307c Add 2009 to copyright years.
Glenn Morris <rgm@gnu.org>
parents: 100936
diff changeset
3 2006, 2007, 2008, 2009 Free Software Foundation, Inc.
74605
6ee41fdd69ff Update AIST copyright years.
Kenichi Handa <handa@m17n.org>
parents: 73995
diff changeset
4 Copyright (C) 1995, 1996, 1997, 1998, 1999, 2000, 2001, 2002, 2003, 2004,
100951
e038c1a8307c Add 2009 to copyright years.
Glenn Morris <rgm@gnu.org>
parents: 100936
diff changeset
5 2005, 2006, 2007, 2008, 2009
67658
547f2b420666 Copyright fixed
Kenichi Handa <handa@m17n.org>
parents: 67555
diff changeset
6 National Institute of Advanced Industrial Science and Technology (AIST)
547f2b420666 Copyright fixed
Kenichi Handa <handa@m17n.org>
parents: 67555
diff changeset
7 Registration Number H14PRO021
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8 Copyright (C) 2003
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9 National Institute of Advanced Industrial Science and Technology (AIST)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10 Registration Number H13PRO009
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
11
17071
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
12 This file is part of GNU Emacs.
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
13
94963
8971ddf55736 Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents: 94944
diff changeset
14 GNU Emacs is free software: you can redistribute it and/or modify
17071
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
15 it under the terms of the GNU General Public License as published by
94963
8971ddf55736 Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents: 94944
diff changeset
16 the Free Software Foundation, either version 3 of the License, or
8971ddf55736 Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents: 94944
diff changeset
17 (at your option) any later version.
17071
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
18
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
19 GNU Emacs is distributed in the hope that it will be useful,
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
20 but WITHOUT ANY WARRANTY; without even the implied warranty of
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
21 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
22 GNU General Public License for more details.
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
23
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
24 You should have received a copy of the GNU General Public License
94963
8971ddf55736 Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents: 94944
diff changeset
25 along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
26
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
27 /*** TABLE OF CONTENTS ***
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
28
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
29 0. General comments
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
30 1. Preamble
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
31 2. Emacs' internal format (emacs-utf-8) handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
32 3. UTF-8 handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
33 4. UTF-16 handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
34 5. Charset-base coding systems handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
35 6. emacs-mule (old Emacs' internal format) handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
36 7. ISO2022 handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
37 8. Shift-JIS and BIG5 handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
38 9. CCL handlers
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
39 10. C library functions
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
40 11. Emacs Lisp library functions
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
41 12. Postamble
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
42
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
43 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
44
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
45 /*** 0. General comments ***
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
46
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
47
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
48 CODING SYSTEM
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
49
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
50 A coding system is an object for an encoding mechanism that contains
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
51 information about how to convert byte sequences to character
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
52 sequences and vice versa. When we say "decode", it means converting
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
53 a byte sequence of a specific coding system into a character
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
54 sequence that is represented by Emacs' internal coding system
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
55 `emacs-utf-8', and when we say "encode", it means converting a
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
56 character sequence of emacs-utf-8 to a byte sequence of a specific
17835
f36ffb6f1208 Name change through the code:
Kenichi Handa <handa@m17n.org>
parents: 17725
diff changeset
57 coding system.
f36ffb6f1208 Name change through the code:
Kenichi Handa <handa@m17n.org>
parents: 17725
diff changeset
58
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
59 In Emacs Lisp, a coding system is represented by a Lisp symbol. In
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
60 C level, a coding system is represented by a vector of attributes
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
61 stored in the hash table Vcharset_hash_table. The conversion from
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
62 coding system symbol to attributes vector is done by looking up
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
63 Vcharset_hash_table by the symbol.
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
64
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
65 Coding systems are classified into the following types depending on
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
66 the encoding mechanism. Here's a brief description of the types.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
67
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
68 o UTF-8
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
69
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
70 o UTF-16
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
71
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
72 o Charset-base coding system
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
73
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
74 A coding system defined by one or more (coded) character sets.
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
75 Decoding and encoding are done by a code converter defined for each
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
76 character set.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
77
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
78 o Old Emacs internal format (emacs-mule)
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
79
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
80 The coding system adopted by old versions of Emacs (20 and 21).
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
81
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
82 o ISO2022-base coding system
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
83
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
84 The most famous coding system for multiple character sets. X's
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
85 Compound Text, various EUCs (Extended Unix Code), and coding systems
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
86 used in the Internet communication such as ISO-2022-JP are all
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
87 variants of ISO2022.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
88
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
89 o SJIS (or Shift-JIS or MS-Kanji-Code)
42104
d69c2368e549 (DECODE_COMPOSITION_END): Fixed a typo in the last
Sam Steingold <sds@gnu.org>
parents: 42103
diff changeset
90
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
91 A coding system to encode character sets: ASCII, JISX0201, and
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
92 JISX0208. Widely used for PC's in Japan. Details are described in
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
93 section 8.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
94
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
95 o BIG5
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
96
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
97 A coding system to encode character sets: ASCII and Big5. Widely
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
98 used for Chinese (mainly in Taiwan and Hong Kong). Details are
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
99 described in section 8. In this file, when we write "big5" (all
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
100 lowercase), we mean the coding system, and when we write "Big5"
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
101 (capitalized), we mean the character set.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
102
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
103 o CCL
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
104
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
105 If a user wants to decode/encode text encoded in a coding system
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
106 not listed above, he can supply a decoder and an encoder for it in
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
107 CCL (Code Conversion Language) programs. Emacs executes the CCL
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
108 program while decoding/encoding.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
109
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
110 o Raw-text
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
111
88771
75c78754826d comments
Dave Love <fx@gnu.org>
parents: 88690
diff changeset
112 A coding system for text containing raw eight-bit data. Emacs
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
113 treats each byte of source text as a character (except for
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
114 end-of-line conversion).
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
115
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
116 o No-conversion
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
117
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
118 Like raw text, but don't do end-of-line conversion.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
119
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
120
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
121 END-OF-LINE FORMAT
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
122
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
123 How text end-of-line is encoded depends on operating system. For
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
124 instance, Unix's format is just one byte of LF (line-feed) code,
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
125 whereas DOS's format is two-byte sequence of `carriage-return' and
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
126 `line-feed' codes. MacOS's format is usually one byte of
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
127 `carriage-return'.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
128
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
129 Since text character encoding and end-of-line encoding are
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
130 independent, any coding system described above can take any format
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
131 of end-of-line (except for no-conversion).
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
132
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
133 STRUCT CODING_SYSTEM
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
134
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
135 Before using a coding system for code conversion (i.e. decoding and
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
136 encoding), we setup a structure of type `struct coding_system'.
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
137 This structure keeps various information about a specific code
88485
e92f62c0073e Doc fixes.
Dave Love <fx@gnu.org>
parents: 88477
diff changeset
138 conversion (e.g. the location of source and destination data).
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
139
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
140 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
141
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
142 /* COMMON MACROS */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
143
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
144
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
145 /*** GENERAL NOTES on `detect_coding_XXX ()' functions ***
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
146
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
147 These functions check if a byte sequence specified as a source in
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
148 CODING conforms to the format of XXX, and update the members of
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
149 DETECT_INFO.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
150
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
151 Return 1 if the byte sequence conforms to XXX, otherwise return 0.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
152
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
153 Below is the template of these functions. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
154
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
155 #if 0
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
156 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
157 detect_coding_XXX (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
158 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
159 struct coding_detection_info *detect_info;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
160 {
90070
95879cc1ed20 Revision: miles@gnu.org--gnu-2004/emacs--unicode--0--patch-81
Miles Bader <miles@gnu.org>
parents: 90061 59173
diff changeset
161 const unsigned char *src = coding->source;
95879cc1ed20 Revision: miles@gnu.org--gnu-2004/emacs--unicode--0--patch-81
Miles Bader <miles@gnu.org>
parents: 90061 59173
diff changeset
162 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
163 int multibytep = coding->src_multibyte;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
164 int consumed_chars = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
165 int found = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
166 ...;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
167
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
168 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
169 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
170 /* Get one byte from the source. If the souce is exausted, jump
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
171 to no_more_source:. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
172 ONE_MORE_BYTE (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
173
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
174 if (! __C_conforms_to_XXX___ (c))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
175 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
176 if (! __C_strongly_suggests_XXX__ (c))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
177 found = CATEGORY_MASK_XXX;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
178 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
179 /* The byte sequence is invalid for XXX. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
180 detect_info->rejected |= CATEGORY_MASK_XXX;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
181 return 0;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
182
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
183 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
184 /* The source exausted successfully. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
185 detect_info->found |= found;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
186 return 1;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
187 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
188 #endif
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
189
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
190 /*** GENERAL NOTES on `decode_coding_XXX ()' functions ***
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
191
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
192 These functions decode a byte sequence specified as a source by
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
193 CODING. The resulting multibyte text goes to a place pointed to by
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
194 CODING->charbuf, the length of which should not exceed
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
195 CODING->charbuf_size;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
196
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
197 These functions set the information of original and decoded texts in
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
198 CODING->consumed, CODING->consumed_char, and CODING->charbuf_used.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
199 They also set CODING->result to one of CODING_RESULT_XXX indicating
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
200 how the decoding is finished.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
201
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
202 Below is the template of these functions. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
203
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
204 #if 0
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
205 static void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
206 decode_coding_XXXX (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
207 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
208 {
90070
95879cc1ed20 Revision: miles@gnu.org--gnu-2004/emacs--unicode--0--patch-81
Miles Bader <miles@gnu.org>
parents: 90061 59173
diff changeset
209 const unsigned char *src = coding->source + coding->consumed;
95879cc1ed20 Revision: miles@gnu.org--gnu-2004/emacs--unicode--0--patch-81
Miles Bader <miles@gnu.org>
parents: 90061 59173
diff changeset
210 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
211 /* SRC_BASE remembers the start position in source in each loop.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
212 The loop will be exited when there's not enough source code, or
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
213 when there's no room in CHARBUF for a decoded character. */
90070
95879cc1ed20 Revision: miles@gnu.org--gnu-2004/emacs--unicode--0--patch-81
Miles Bader <miles@gnu.org>
parents: 90061 59173
diff changeset
214 const unsigned char *src_base;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
215 /* A buffer to produce decoded characters. */
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
216 int *charbuf = coding->charbuf + coding->charbuf_used;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
217 int *charbuf_end = coding->charbuf + coding->charbuf_size;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
218 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
219
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
220 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
221 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
222 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
223 if (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
224 /* No more room to produce a decoded character. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
225 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
226 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
227 /* Decode it. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
228 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
229
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
230 no_more_source:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
231 if (src_base < src_end
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
232 && coding->mode & CODING_MODE_LAST_BLOCK)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
233 /* If the source ends by partial bytes to construct a character,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
234 treat them as eight-bit raw data. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
235 while (src_base < src_end && charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
236 *charbuf++ = *src_base++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
237 /* Remember how many bytes and characters we consumed. If the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
238 source is multibyte, the bytes and chars are not identical. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
239 coding->consumed = coding->consumed_char = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
240 /* Remember how many characters we produced. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
241 coding->charbuf_used = charbuf - coding->charbuf;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
242 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
243 #endif
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
244
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
245 /*** GENERAL NOTES on `encode_coding_XXX ()' functions ***
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
246
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
247 These functions encode SRC_BYTES length text at SOURCE of Emacs'
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
248 internal multibyte format by CODING. The resulting byte sequence
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
249 goes to a place pointed to by DESTINATION, the length of which
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
250 should not exceed DST_BYTES.
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
251
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
252 These functions set the information of original and encoded texts in
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
253 the members produced, produced_char, consumed, and consumed_char of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
254 the structure *CODING. They also set the member result to one of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
255 CODING_RESULT_XXX indicating how the encoding finished.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
256
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
257 DST_BYTES zero means that source area and destination area are
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
258 overlapped, which means that we can produce a encoded text until it
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
259 reaches at the head of not-yet-encoded source text.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
260
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
261 Below is a template of these functions. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
262 #if 0
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
263 static void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
264 encode_coding_XXX (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
265 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
266 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
267 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
268 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
269 int *charbuf_end = charbuf->charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
270 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
271 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
272 unsigned char *adjusted_dst_end = dst_end - _MAX_BYTES_PRODUCED_IN_LOOP_;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
273 int produced_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
274
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
275 for (; charbuf < charbuf_end && dst < adjusted_dst_end; charbuf++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
276 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
277 int c = *charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
278 /* Encode C into DST, and increment DST. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
279 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
280 label_no_more_destination:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
281 /* How many chars and bytes we produced. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
282 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
283 coding->produced = dst - coding->destination;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
284 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
285 #endif
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
286
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
287
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
288 /*** 1. Preamble ***/
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
289
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
290 #include <config.h>
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
291 #include <stdio.h>
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
292
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
293 #include "lisp.h"
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
294 #include "buffer.h"
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
295 #include "character.h"
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
296 #include "charset.h"
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
297 #include "ccl.h"
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
298 #include "composite.h"
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
299 #include "coding.h"
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
300 #include "window.h"
83127
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
301 #include "frame.h"
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
302 #include "termhooks.h"
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
303
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
304 Lisp_Object Vcoding_system_hash_table;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
305
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
306 Lisp_Object Qcoding_system, Qcoding_aliases, Qeol_type;
88646
d3b1f30e2267 (Qmac): Remove (duplicated) definition.
Dave Love <fx@gnu.org>
parents: 88645
diff changeset
307 Lisp_Object Qunix, Qdos;
d3b1f30e2267 (Qmac): Remove (duplicated) definition.
Dave Love <fx@gnu.org>
parents: 88645
diff changeset
308 extern Lisp_Object Qmac; /* frame.c */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
309 Lisp_Object Qbuffer_file_coding_system;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
310 Lisp_Object Qpost_read_conversion, Qpre_write_conversion;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
311 Lisp_Object Qdefault_char;
19612
783efd6c7c1e (Qno_conversion, Qundecided): New variables.
Kenichi Handa <handa@m17n.org>
parents: 19546
diff changeset
312 Lisp_Object Qno_conversion, Qundecided;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
313 Lisp_Object Qcharset, Qiso_2022, Qutf_8, Qutf_16, Qshift_jis, Qbig5;
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
314 Lisp_Object Qbig, Qlittle;
19750
95e4e1cba6ac (Qcoding_system_history): New variable.
Richard M. Stallman <rms@gnu.org>
parents: 19747
diff changeset
315 Lisp_Object Qcoding_system_history;
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
316 Lisp_Object Qvalid_codes;
100303
3e044fa54e4f * coding.c (QCdefault_char): Rename from QCdefalut_char.
Juanma Barranquero <lekktu@gmail.com>
parents: 100262
diff changeset
317 Lisp_Object QCcategory, QCmnemonic, QCdefault_char;
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
318 Lisp_Object QCdecode_translation_table, QCencode_translation_table;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
319 Lisp_Object QCpost_read_conversion, QCpre_write_conversion;
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
320 Lisp_Object QCascii_compatible_p;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
321
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
322 extern Lisp_Object Qinsert_file_contents, Qwrite_region;
64251
3de1b955c31a * coding.c (Qprocess_argument):
Kim F. Storm <storm@cua.dk>
parents: 64084
diff changeset
323 Lisp_Object Qcall_process, Qcall_process_region;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
324 Lisp_Object Qstart_process, Qopen_network_stream;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
325 Lisp_Object Qtarget_idx;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
326
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
327 Lisp_Object Qinsufficient_source, Qinconsistent_eol, Qinvalid_source;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
328 Lisp_Object Qinterrupted, Qinsufficient_memory;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
329
79107
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
330 extern Lisp_Object Qcompletion_ignore_case;
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
331
52794
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
332 /* If a symbol has this property, evaluate the value to define the
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
333 symbol as a coding system. */
90272
f1df126ec7de Sync to HEAD for handling autoload-coding-system.
Kenichi Handa <handa@m17n.org>
parents: 90263
diff changeset
334 static Lisp_Object Qcoding_system_define_form;
f1df126ec7de Sync to HEAD for handling autoload-coding-system.
Kenichi Handa <handa@m17n.org>
parents: 90263
diff changeset
335
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
336 int coding_system_require_warning;
52794
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
337
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
338 Lisp_Object Vselect_safe_coding_system_function;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
339
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
340 /* Mnemonic string for each format of end-of-line. */
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
341 Lisp_Object eol_mnemonic_unix, eol_mnemonic_dos, eol_mnemonic_mac;
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
342 /* Mnemonic string to indicate format of end-of-line is not yet
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
343 decided. */
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
344 Lisp_Object eol_mnemonic_undecided;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
345
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
346 /* Format of end-of-line decided by system. This is Qunix on
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
347 Unix and Mac, Qdos on DOS/Windows.
70520
b6740a317343 (setup_coding_system): For invalid coding-system, set
Kenichi Handa <handa@m17n.org>
parents: 69995
diff changeset
348 This has an effect only for external encoding (i.e. for output to
b6740a317343 (setup_coding_system): For invalid coding-system, set
Kenichi Handa <handa@m17n.org>
parents: 69995
diff changeset
349 file and process), not for in-buffer or Lisp string encoding. */
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
350 static Lisp_Object system_eol_type;
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
351
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
352 #ifdef emacs
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
353
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
354 Lisp_Object Vcoding_system_list, Vcoding_system_alist;
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
355
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
356 Lisp_Object Qcoding_system_p, Qcoding_system_error;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
357
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
358 /* Coding system emacs-mule and raw-text are for converting only
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
359 end-of-line format. */
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
360 Lisp_Object Qemacs_mule, Qraw_text;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
361 Lisp_Object Qutf_8_emacs;
51406
3c675181c3d8 (Qutf_8): New.
Dave Love <fx@gnu.org>
parents: 51356
diff changeset
362
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
363 /* Coding-systems are handed between Emacs Lisp programs and C internal
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
364 routines by the following three variables. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
365 /* Coding-system for reading files and receiving data from process. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
366 Lisp_Object Vcoding_system_for_read;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
367 /* Coding-system for writing files and sending data to process. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
368 Lisp_Object Vcoding_system_for_write;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
369 /* Coding-system actually used in the latest I/O. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
370 Lisp_Object Vlast_coding_system_used;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
371 /* Set to non-nil when an error is detected while code conversion. */
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
372 Lisp_Object Vlast_code_conversion_error;
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
373 /* A vector of length 256 which contains information about special
22529
d9eac134a41b Doc fixes.
Karl Heuer <kwzh@gnu.org>
parents: 22502
diff changeset
374 Latin codes (especially for dealing with Microsoft codes). */
19365
d9374f5ebd3a (CODING_FLAG_ISO_LATIN_EXTRA): New macro.
Kenichi Handa <handa@m17n.org>
parents: 19285
diff changeset
375 Lisp_Object Vlatin_extra_code_table;
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
376
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
377 /* Flag to inhibit code conversion of end-of-line format. */
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
378 int inhibit_eol_conversion;
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
379
30204
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
380 /* Flag to inhibit ISO2022 escape sequence detection. */
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
381 int inhibit_iso_escape_detection;
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
382
101040
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
383 /* Flag to inhibit detection of binary files through null bytes. */
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
384 int inhibit_null_byte_detection;
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
385
21574
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
386 /* Flag to make buffer-file-coding-system inherit from process-coding. */
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
387 int inherit_process_coding_system;
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
388
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
389 /* Coding system to be used to encode text for terminal display when
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
390 terminal coding system is nil. */
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
391 struct coding_system safe_terminal_coding;
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
392
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
393 Lisp_Object Vfile_coding_system_alist;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
394 Lisp_Object Vprocess_coding_system_alist;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
395 Lisp_Object Vnetwork_coding_system_alist;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
396
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
397 Lisp_Object Vlocale_coding_system;
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
398
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
399 #endif /* emacs */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
400
22186
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
401 /* Flag to tell if we look up translation table on character code
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
402 conversion. */
22119
592bb8b9bcfd Change terms unify/unification to
Kenichi Handa <handa@m17n.org>
parents: 22020
diff changeset
403 Lisp_Object Venable_character_translation;
22186
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
404 /* Standard translation table to look up on decoding (reading). */
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
405 Lisp_Object Vstandard_translation_table_for_decode;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
406 /* Standard translation table to look up on encoding (writing). */
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
407 Lisp_Object Vstandard_translation_table_for_encode;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
408
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
409 Lisp_Object Qtranslation_table;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
410 Lisp_Object Qtranslation_table_id;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
411 Lisp_Object Qtranslation_table_for_decode;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
412 Lisp_Object Qtranslation_table_for_encode;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
413
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
414 /* Alist of charsets vs revision number. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
415 static Lisp_Object Vcharset_revision_table;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
416
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
417 /* Default coding systems used for process I/O. */
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
418 Lisp_Object Vdefault_process_coding_system;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
419
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
420 /* Char table for translating Quail and self-inserting input. */
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
421 Lisp_Object Vtranslation_table_for_input;
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
422
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
423 /* Two special coding systems. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
424 Lisp_Object Vsjis_coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
425 Lisp_Object Vbig5_coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
426
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
427 /* ISO2022 section */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
428
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
429 #define CODING_ISO_INITIAL(coding, reg) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
430 (XINT (AREF (AREF (CODING_ID_ATTRS ((coding)->id), \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
431 coding_attr_iso_initial), \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
432 reg)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
433
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
434
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
435 #define CODING_ISO_REQUEST(coding, charset_id) \
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
436 (((charset_id) <= (coding)->max_charset_id \
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
437 ? ((coding)->safe_charsets[charset_id] != 255 \
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
438 ? (coding)->safe_charsets[charset_id] \
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
439 : -1) \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
440 : -1))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
441
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
442
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
443 #define CODING_ISO_FLAGS(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
444 ((coding)->spec.iso_2022.flags)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
445 #define CODING_ISO_DESIGNATION(coding, reg) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
446 ((coding)->spec.iso_2022.current_designation[reg])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
447 #define CODING_ISO_INVOCATION(coding, plane) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
448 ((coding)->spec.iso_2022.current_invocation[plane])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
449 #define CODING_ISO_SINGLE_SHIFTING(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
450 ((coding)->spec.iso_2022.single_shifting)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
451 #define CODING_ISO_BOL(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
452 ((coding)->spec.iso_2022.bol)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
453 #define CODING_ISO_INVOKED_CHARSET(coding, plane) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
454 CODING_ISO_DESIGNATION ((coding), CODING_ISO_INVOCATION ((coding), (plane)))
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
455 #define CODING_ISO_CMP_STATUS(coding) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
456 (&(coding)->spec.iso_2022.cmp_status)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
457 #define CODING_ISO_EXTSEGMENT_LEN(coding) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
458 ((coding)->spec.iso_2022.ctext_extended_segment_len)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
459 #define CODING_ISO_EMBEDDED_UTF_8(coding) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
460 ((coding)->spec.iso_2022.embedded_utf_8)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
461
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
462 /* Control characters of ISO2022. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
463 /* code */ /* function */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
464 #define ISO_CODE_LF 0x0A /* line-feed */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
465 #define ISO_CODE_CR 0x0D /* carriage-return */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
466 #define ISO_CODE_SO 0x0E /* shift-out */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
467 #define ISO_CODE_SI 0x0F /* shift-in */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
468 #define ISO_CODE_SS2_7 0x19 /* single-shift-2 for 7-bit code */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
469 #define ISO_CODE_ESC 0x1B /* escape */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
470 #define ISO_CODE_SS2 0x8E /* single-shift-2 */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
471 #define ISO_CODE_SS3 0x8F /* single-shift-3 */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
472 #define ISO_CODE_CSI 0x9B /* control-sequence-introducer */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
473
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
474 /* All code (1-byte) of ISO2022 is classified into one of the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
475 followings. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
476 enum iso_code_class_type
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
477 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
478 ISO_control_0, /* Control codes in the range
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
479 0x00..0x1F and 0x7F, except for the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
480 following 5 codes. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
481 ISO_shift_out, /* ISO_CODE_SO (0x0E) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
482 ISO_shift_in, /* ISO_CODE_SI (0x0F) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
483 ISO_single_shift_2_7, /* ISO_CODE_SS2_7 (0x19) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
484 ISO_escape, /* ISO_CODE_SO (0x1B) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
485 ISO_control_1, /* Control codes in the range
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
486 0x80..0x9F, except for the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
487 following 3 codes. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
488 ISO_single_shift_2, /* ISO_CODE_SS2 (0x8E) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
489 ISO_single_shift_3, /* ISO_CODE_SS3 (0x8F) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
490 ISO_control_sequence_introducer, /* ISO_CODE_CSI (0x9B) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
491 ISO_0x20_or_0x7F, /* Codes of the values 0x20 or 0x7F. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
492 ISO_graphic_plane_0, /* Graphic codes in the range 0x21..0x7E. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
493 ISO_0xA0_or_0xFF, /* Codes of the values 0xA0 or 0xFF. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
494 ISO_graphic_plane_1 /* Graphic codes in the range 0xA1..0xFE. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
495 };
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
496
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
497 /** The macros CODING_ISO_FLAG_XXX defines a flag bit of the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
498 `iso-flags' attribute of an iso2022 coding system. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
499
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
500 /* If set, produce long-form designation sequence (e.g. ESC $ ( A)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
501 instead of the correct short-form sequence (e.g. ESC $ A). */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
502 #define CODING_ISO_FLAG_LONG_FORM 0x0001
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
503
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
504 /* If set, reset graphic planes and registers at end-of-line to the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
505 initial state. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
506 #define CODING_ISO_FLAG_RESET_AT_EOL 0x0002
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
507
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
508 /* If set, reset graphic planes and registers before any control
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
509 characters to the initial state. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
510 #define CODING_ISO_FLAG_RESET_AT_CNTL 0x0004
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
511
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
512 /* If set, encode by 7-bit environment. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
513 #define CODING_ISO_FLAG_SEVEN_BITS 0x0008
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
514
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
515 /* If set, use locking-shift function. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
516 #define CODING_ISO_FLAG_LOCKING_SHIFT 0x0010
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
517
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
518 /* If set, use single-shift function. Overwrite
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
519 CODING_ISO_FLAG_LOCKING_SHIFT. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
520 #define CODING_ISO_FLAG_SINGLE_SHIFT 0x0020
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
521
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
522 /* If set, use designation escape sequence. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
523 #define CODING_ISO_FLAG_DESIGNATION 0x0040
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
524
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
525 /* If set, produce revision number sequence. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
526 #define CODING_ISO_FLAG_REVISION 0x0080
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
527
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
528 /* If set, produce ISO6429's direction specifying sequence. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
529 #define CODING_ISO_FLAG_DIRECTION 0x0100
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
530
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
531 /* If set, assume designation states are reset at beginning of line on
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
532 output. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
533 #define CODING_ISO_FLAG_INIT_AT_BOL 0x0200
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
534
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
535 /* If set, designation sequence should be placed at beginning of line
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
536 on output. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
537 #define CODING_ISO_FLAG_DESIGNATE_AT_BOL 0x0400
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
538
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
539 /* If set, do not encode unsafe charactes on output. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
540 #define CODING_ISO_FLAG_SAFE 0x0800
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
541
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
542 /* If set, extra latin codes (128..159) are accepted as a valid code
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
543 on input. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
544 #define CODING_ISO_FLAG_LATIN_EXTRA 0x1000
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
545
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
546 #define CODING_ISO_FLAG_COMPOSITION 0x2000
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
547
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
548 #define CODING_ISO_FLAG_EUC_TW_SHIFT 0x4000
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
549
88681
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
550 #define CODING_ISO_FLAG_USE_ROMAN 0x8000
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
551
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
552 #define CODING_ISO_FLAG_USE_OLDJIS 0x10000
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
553
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
554 #define CODING_ISO_FLAG_FULL_SUPPORT 0x100000
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
555
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
556 /* A character to be produced on output if encoding of the original
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
557 character is prohibited by CODING_ISO_FLAG_SAFE. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
558 #define CODING_INHIBIT_CHARACTER_SUBSTITUTION '?'
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
559
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
560 /* UTF-8 section */
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
561 #define CODING_UTF_8_BOM(coding) \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
562 ((coding)->spec.utf_8_bom)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
563
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
564 /* UTF-16 section */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
565 #define CODING_UTF_16_BOM(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
566 ((coding)->spec.utf_16.bom)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
567
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
568 #define CODING_UTF_16_ENDIAN(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
569 ((coding)->spec.utf_16.endian)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
570
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
571 #define CODING_UTF_16_SURROGATE(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
572 ((coding)->spec.utf_16.surrogate)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
573
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
574
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
575 /* CCL section */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
576 #define CODING_CCL_DECODER(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
577 AREF (CODING_ID_ATTRS ((coding)->id), coding_attr_ccl_decoder)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
578 #define CODING_CCL_ENCODER(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
579 AREF (CODING_ID_ATTRS ((coding)->id), coding_attr_ccl_encoder)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
580 #define CODING_CCL_VALIDS(coding) \
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
581 (SDATA (AREF (CODING_ID_ATTRS ((coding)->id), coding_attr_ccl_valids)))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
582
88771
75c78754826d comments
Dave Love <fx@gnu.org>
parents: 88690
diff changeset
583 /* Index for each coding category in `coding_categories' */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
584
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
585 enum coding_category
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
586 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
587 coding_category_iso_7,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
588 coding_category_iso_7_tight,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
589 coding_category_iso_8_1,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
590 coding_category_iso_8_2,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
591 coding_category_iso_7_else,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
592 coding_category_iso_8_else,
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
593 coding_category_utf_8_auto,
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
594 coding_category_utf_8_nosig,
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
595 coding_category_utf_8_sig,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
596 coding_category_utf_16_auto,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
597 coding_category_utf_16_be,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
598 coding_category_utf_16_le,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
599 coding_category_utf_16_be_nosig,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
600 coding_category_utf_16_le_nosig,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
601 coding_category_charset,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
602 coding_category_sjis,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
603 coding_category_big5,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
604 coding_category_ccl,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
605 coding_category_emacs_mule,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
606 /* All above are targets of code detection. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
607 coding_category_raw_text,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
608 coding_category_undecided,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
609 coding_category_max
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
610 };
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
611
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
612 /* Definitions of flag bits used in detect_coding_XXXX. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
613 #define CATEGORY_MASK_ISO_7 (1 << coding_category_iso_7)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
614 #define CATEGORY_MASK_ISO_7_TIGHT (1 << coding_category_iso_7_tight)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
615 #define CATEGORY_MASK_ISO_8_1 (1 << coding_category_iso_8_1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
616 #define CATEGORY_MASK_ISO_8_2 (1 << coding_category_iso_8_2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
617 #define CATEGORY_MASK_ISO_7_ELSE (1 << coding_category_iso_7_else)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
618 #define CATEGORY_MASK_ISO_8_ELSE (1 << coding_category_iso_8_else)
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
619 #define CATEGORY_MASK_UTF_8_AUTO (1 << coding_category_utf_8_auto)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
620 #define CATEGORY_MASK_UTF_8_NOSIG (1 << coding_category_utf_8_nosig)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
621 #define CATEGORY_MASK_UTF_8_SIG (1 << coding_category_utf_8_sig)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
622 #define CATEGORY_MASK_UTF_16_AUTO (1 << coding_category_utf_16_auto)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
623 #define CATEGORY_MASK_UTF_16_BE (1 << coding_category_utf_16_be)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
624 #define CATEGORY_MASK_UTF_16_LE (1 << coding_category_utf_16_le)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
625 #define CATEGORY_MASK_UTF_16_BE_NOSIG (1 << coding_category_utf_16_be_nosig)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
626 #define CATEGORY_MASK_UTF_16_LE_NOSIG (1 << coding_category_utf_16_le_nosig)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
627 #define CATEGORY_MASK_CHARSET (1 << coding_category_charset)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
628 #define CATEGORY_MASK_SJIS (1 << coding_category_sjis)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
629 #define CATEGORY_MASK_BIG5 (1 << coding_category_big5)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
630 #define CATEGORY_MASK_CCL (1 << coding_category_ccl)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
631 #define CATEGORY_MASK_EMACS_MULE (1 << coding_category_emacs_mule)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
632 #define CATEGORY_MASK_RAW_TEXT (1 << coding_category_raw_text)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
633
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
634 /* This value is returned if detect_coding_mask () find nothing other
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
635 than ASCII characters. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
636 #define CATEGORY_MASK_ANY \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
637 (CATEGORY_MASK_ISO_7 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
638 | CATEGORY_MASK_ISO_7_TIGHT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
639 | CATEGORY_MASK_ISO_8_1 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
640 | CATEGORY_MASK_ISO_8_2 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
641 | CATEGORY_MASK_ISO_7_ELSE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
642 | CATEGORY_MASK_ISO_8_ELSE \
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
643 | CATEGORY_MASK_UTF_8_AUTO \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
644 | CATEGORY_MASK_UTF_8_NOSIG \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
645 | CATEGORY_MASK_UTF_8_SIG \
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
646 | CATEGORY_MASK_UTF_16_AUTO \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
647 | CATEGORY_MASK_UTF_16_BE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
648 | CATEGORY_MASK_UTF_16_LE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
649 | CATEGORY_MASK_UTF_16_BE_NOSIG \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
650 | CATEGORY_MASK_UTF_16_LE_NOSIG \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
651 | CATEGORY_MASK_CHARSET \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
652 | CATEGORY_MASK_SJIS \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
653 | CATEGORY_MASK_BIG5 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
654 | CATEGORY_MASK_CCL \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
655 | CATEGORY_MASK_EMACS_MULE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
656
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
657
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
658 #define CATEGORY_MASK_ISO_7BIT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
659 (CATEGORY_MASK_ISO_7 | CATEGORY_MASK_ISO_7_TIGHT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
660
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
661 #define CATEGORY_MASK_ISO_8BIT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
662 (CATEGORY_MASK_ISO_8_1 | CATEGORY_MASK_ISO_8_2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
663
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
664 #define CATEGORY_MASK_ISO_ELSE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
665 (CATEGORY_MASK_ISO_7_ELSE | CATEGORY_MASK_ISO_8_ELSE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
666
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
667 #define CATEGORY_MASK_ISO_ESCAPE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
668 (CATEGORY_MASK_ISO_7 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
669 | CATEGORY_MASK_ISO_7_TIGHT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
670 | CATEGORY_MASK_ISO_7_ELSE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
671 | CATEGORY_MASK_ISO_8_ELSE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
672
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
673 #define CATEGORY_MASK_ISO \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
674 ( CATEGORY_MASK_ISO_7BIT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
675 | CATEGORY_MASK_ISO_8BIT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
676 | CATEGORY_MASK_ISO_ELSE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
677
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
678 #define CATEGORY_MASK_UTF_16 \
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
679 (CATEGORY_MASK_UTF_16_AUTO \
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
680 | CATEGORY_MASK_UTF_16_BE \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
681 | CATEGORY_MASK_UTF_16_LE \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
682 | CATEGORY_MASK_UTF_16_BE_NOSIG \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
683 | CATEGORY_MASK_UTF_16_LE_NOSIG)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
684
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
685 #define CATEGORY_MASK_UTF_8 \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
686 (CATEGORY_MASK_UTF_8_AUTO \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
687 | CATEGORY_MASK_UTF_8_NOSIG \
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
688 | CATEGORY_MASK_UTF_8_SIG)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
689
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
690 /* List of symbols `coding-category-xxx' ordered by priority. This
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
691 variable is exposed to Emacs Lisp. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
692 static Lisp_Object Vcoding_category_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
693
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
694 /* Table of coding categories (Lisp symbols). This variable is for
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
695 internal use oly. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
696 static Lisp_Object Vcoding_category_table;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
697
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
698 /* Table of coding-categories ordered by priority. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
699 static enum coding_category coding_priorities[coding_category_max];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
700
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
701 /* Nth element is a coding context for the coding system bound to the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
702 Nth coding category. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
703 static struct coding_system coding_categories[coding_category_max];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
704
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
705 /*** Commonly used macros and functions ***/
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
706
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
707 #ifndef min
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
708 #define min(a, b) ((a) < (b) ? (a) : (b))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
709 #endif
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
710 #ifndef max
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
711 #define max(a, b) ((a) > (b) ? (a) : (b))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
712 #endif
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
713
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
714 #define CODING_GET_INFO(coding, attrs, charset_list) \
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
715 do { \
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
716 (attrs) = CODING_ID_ATTRS ((coding)->id); \
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
717 (charset_list) = CODING_ATTR_CHARSET_LIST (attrs); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
718 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
719
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
720
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
721 /* Safely get one byte from the source text pointed by SRC which ends
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
722 at SRC_END, and set C to that byte. If there are not enough bytes
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
723 in the source, it jumps to `no_more_source'. If multibytep is
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
724 nonzero, and a multibyte character is found at SRC, set C to the
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
725 negative value of the character code. The caller should declare
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
726 and set these variables appropriately in advance:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
727 src, src_end, multibytep */
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
728
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
729 #define ONE_MORE_BYTE(c) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
730 do { \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
731 if (src == src_end) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
732 { \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
733 if (src_base < src) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
734 record_conversion_result \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
735 (coding, CODING_RESULT_INSUFFICIENT_SRC); \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
736 goto no_more_source; \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
737 } \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
738 c = *src++; \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
739 if (multibytep && (c & 0x80)) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
740 { \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
741 if ((c & 0xFE) == 0xC0) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
742 c = ((c & 1) << 6) | *src++; \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
743 else \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
744 { \
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
745 src--; \
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
746 c = - string_char (src, &src, NULL); \
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
747 record_conversion_result \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
748 (coding, CODING_RESULT_INVALID_SRC); \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
749 } \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
750 } \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
751 consumed_chars++; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
752 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
753
101172
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
754 /* Safely get two bytes from the source text pointed by SRC which ends
101174
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
755 at SRC_END, and set C1 and C2 to those bytes while skipping the
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
756 heading multibyte characters. If there are not enough bytes in the
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
757 source, it jumps to `no_more_source'. If multibytep is nonzero and
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
758 a multibyte character is found for C2, set C2 to the negative value
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
759 of the character code. The caller should declare and set these
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
760 variables appropriately in advance:
101172
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
761 src, src_end, multibytep
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
762 It is intended that this macro is used in detect_coding_utf_16. */
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
763
101174
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
764 #define TWO_MORE_BYTES(c1, c2) \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
765 do { \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
766 do { \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
767 if (src == src_end) \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
768 goto no_more_source; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
769 c1 = *src++; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
770 if (multibytep && (c1 & 0x80)) \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
771 { \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
772 if ((c1 & 0xFE) == 0xC0) \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
773 c1 = ((c1 & 1) << 6) | *src++; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
774 else \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
775 { \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
776 src += BYTES_BY_CHAR_HEAD (c1) - 1; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
777 c1 = -1; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
778 } \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
779 } \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
780 } while (c1 < 0); \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
781 if (src == src_end) \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
782 goto no_more_source; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
783 c2 = *src++; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
784 if (multibytep && (c2 & 0x80)) \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
785 { \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
786 if ((c2 & 0xFE) == 0xC0) \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
787 c2 = ((c2 & 1) << 6) | *src++; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
788 else \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
789 c2 = -1; \
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
790 } \
101172
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
791 } while (0)
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
792
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
793
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
794 #define ONE_MORE_BYTE_NO_CHECK(c) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
795 do { \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
796 c = *src++; \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
797 if (multibytep && (c & 0x80)) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
798 { \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
799 if ((c & 0xFE) == 0xC0) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
800 c = ((c & 1) << 6) | *src++; \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
801 else \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
802 { \
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
803 src--; \
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
804 c = - string_char (src, &src, NULL); \
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
805 record_conversion_result \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
806 (coding, CODING_RESULT_INVALID_SRC); \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
807 } \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
808 } \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
809 consumed_chars++; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
810 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
811
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
812
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
813 /* Store a byte C in the place pointed by DST and increment DST to the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
814 next free point, and increment PRODUCED_CHARS. The caller should
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
815 assure that C is 0..127, and declare and set the variable `dst'
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
816 appropriately in advance.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
817 */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
818
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
819
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
820 #define EMIT_ONE_ASCII_BYTE(c) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
821 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
822 produced_chars++; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
823 *dst++ = (c); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
824 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
825
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
826
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
827 /* Like EMIT_ONE_ASCII_BYTE byt store two bytes; C1 and C2. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
828
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
829 #define EMIT_TWO_ASCII_BYTES(c1, c2) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
830 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
831 produced_chars += 2; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
832 *dst++ = (c1), *dst++ = (c2); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
833 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
834
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
835
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
836 /* Store a byte C in the place pointed by DST and increment DST to the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
837 next free point, and increment PRODUCED_CHARS. If MULTIBYTEP is
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
838 nonzero, store in an appropriate multibyte from. The caller should
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
839 declare and set the variables `dst' and `multibytep' appropriately
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
840 in advance. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
841
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
842 #define EMIT_ONE_BYTE(c) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
843 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
844 produced_chars++; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
845 if (multibytep) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
846 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
847 int ch = (c); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
848 if (ch >= 0x80) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
849 ch = BYTE8_TO_CHAR (ch); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
850 CHAR_STRING_ADVANCE (ch, dst); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
851 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
852 else \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
853 *dst++ = (c); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
854 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
855
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
856
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
857 /* Like EMIT_ONE_BYTE, but emit two bytes; C1 and C2. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
858
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
859 #define EMIT_TWO_BYTES(c1, c2) \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
860 do { \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
861 produced_chars += 2; \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
862 if (multibytep) \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
863 { \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
864 int ch; \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
865 \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
866 ch = (c1); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
867 if (ch >= 0x80) \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
868 ch = BYTE8_TO_CHAR (ch); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
869 CHAR_STRING_ADVANCE (ch, dst); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
870 ch = (c2); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
871 if (ch >= 0x80) \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
872 ch = BYTE8_TO_CHAR (ch); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
873 CHAR_STRING_ADVANCE (ch, dst); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
874 } \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
875 else \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
876 { \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
877 *dst++ = (c1); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
878 *dst++ = (c2); \
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
879 } \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
880 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
881
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
882
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
883 #define EMIT_THREE_BYTES(c1, c2, c3) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
884 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
885 EMIT_ONE_BYTE (c1); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
886 EMIT_TWO_BYTES (c2, c3); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
887 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
888
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
889
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
890 #define EMIT_FOUR_BYTES(c1, c2, c3, c4) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
891 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
892 EMIT_TWO_BYTES (c1, c2); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
893 EMIT_TWO_BYTES (c3, c4); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
894 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
895
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
896
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
897 /* Prototypes for static functions. */
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
898 static void record_conversion_result P_ ((struct coding_system *coding,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
899 enum coding_result_code result));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
900 static int detect_coding_utf_8 P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
901 struct coding_detection_info *info));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
902 static void decode_coding_utf_8 P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
903 static int encode_coding_utf_8 P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
904
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
905 static int detect_coding_utf_16 P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
906 struct coding_detection_info *info));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
907 static void decode_coding_utf_16 P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
908 static int encode_coding_utf_16 P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
909
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
910 static int detect_coding_iso_2022 P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
911 struct coding_detection_info *info));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
912 static void decode_coding_iso_2022 P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
913 static int encode_coding_iso_2022 P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
914
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
915 static int detect_coding_emacs_mule P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
916 struct coding_detection_info *info));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
917 static void decode_coding_emacs_mule P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
918 static int encode_coding_emacs_mule P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
919
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
920 static int detect_coding_sjis P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
921 struct coding_detection_info *info));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
922 static void decode_coding_sjis P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
923 static int encode_coding_sjis P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
924
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
925 static int detect_coding_big5 P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
926 struct coding_detection_info *info));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
927 static void decode_coding_big5 P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
928 static int encode_coding_big5 P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
929
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
930 static int detect_coding_ccl P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
931 struct coding_detection_info *info));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
932 static void decode_coding_ccl P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
933 static int encode_coding_ccl P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
934
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
935 static void decode_coding_raw_text P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
936 static int encode_coding_raw_text P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
937
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
938 static void coding_set_source P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
939 static void coding_set_destination P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
940 static void coding_alloc_by_realloc P_ ((struct coding_system *, EMACS_INT));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
941 static void coding_alloc_by_making_gap P_ ((struct coding_system *,
90772
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
942 EMACS_INT, EMACS_INT));
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
943 static unsigned char *alloc_destination P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
944 EMACS_INT, unsigned char *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
945 static void setup_iso_safe_charsets P_ ((Lisp_Object));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
946 static unsigned char *encode_designation_at_bol P_ ((struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
947 int *, int *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
948 unsigned char *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
949 static int detect_eol P_ ((const unsigned char *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
950 EMACS_INT, enum coding_category));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
951 static Lisp_Object adjust_coding_eol_type P_ ((struct coding_system *, int));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
952 static void decode_eol P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
953 static Lisp_Object get_translation_table P_ ((Lisp_Object, int, int *));
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
954 static Lisp_Object get_translation P_ ((Lisp_Object, int *, int *));
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
955 static int produce_chars P_ ((struct coding_system *, Lisp_Object, int));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
956 static INLINE void produce_charset P_ ((struct coding_system *, int *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
957 EMACS_INT));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
958 static void produce_annotation P_ ((struct coding_system *, EMACS_INT));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
959 static int decode_coding P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
960 static INLINE int *handle_composition_annotation P_ ((EMACS_INT, EMACS_INT,
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
961 struct coding_system *,
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
962 int *, EMACS_INT *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
963 static INLINE int *handle_charset_annotation P_ ((EMACS_INT, EMACS_INT,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
964 struct coding_system *,
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
965 int *, EMACS_INT *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
966 static void consume_chars P_ ((struct coding_system *, Lisp_Object, int));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
967 static int encode_coding P_ ((struct coding_system *));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
968 static Lisp_Object make_conversion_work_buffer P_ ((int));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
969 static Lisp_Object code_conversion_restore P_ ((Lisp_Object));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
970 static INLINE int char_encodable_p P_ ((int, Lisp_Object));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
971 static Lisp_Object make_subsidiaries P_ ((Lisp_Object));
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
972
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
973 static void
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
974 record_conversion_result (struct coding_system *coding,
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
975 enum coding_result_code result)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
976 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
977 coding->result = result;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
978 switch (result)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
979 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
980 case CODING_RESULT_INSUFFICIENT_SRC:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
981 Vlast_code_conversion_error = Qinsufficient_source;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
982 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
983 case CODING_RESULT_INCONSISTENT_EOL:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
984 Vlast_code_conversion_error = Qinconsistent_eol;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
985 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
986 case CODING_RESULT_INVALID_SRC:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
987 Vlast_code_conversion_error = Qinvalid_source;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
988 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
989 case CODING_RESULT_INTERRUPT:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
990 Vlast_code_conversion_error = Qinterrupted;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
991 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
992 case CODING_RESULT_INSUFFICIENT_MEM:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
993 Vlast_code_conversion_error = Qinsufficient_memory;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
994 break;
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
995 default:
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
996 Vlast_code_conversion_error = intern ("Unknown error");
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
997 }
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
998 }
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
999
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1000 #define CODING_DECODE_CHAR(coding, src, src_base, src_end, charset, code, c) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1001 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1002 charset_map_loaded = 0; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1003 c = DECODE_CHAR (charset, code); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1004 if (charset_map_loaded) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1005 { \
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1006 const unsigned char *orig = coding->source; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1007 EMACS_INT offset; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1008 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1009 coding_set_source (coding); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1010 offset = coding->source - orig; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1011 src += offset; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1012 src_base += offset; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1013 src_end += offset; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1014 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1015 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1016
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1017
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1018 /* If there are at least BYTES length of room at dst, allocate memory
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1019 for coding->destination and update dst and dst_end. We don't have
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1020 to take care of coding->source which will be relocated. It is
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1021 handled by calling coding_set_source in encode_coding. */
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1022
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1023 #define ASSURE_DESTINATION(bytes) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1024 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1025 if (dst + (bytes) >= dst_end) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1026 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1027 int more_bytes = charbuf_end - charbuf + (bytes); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1028 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1029 dst = alloc_destination (coding, more_bytes, dst); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1030 dst_end = coding->destination + coding->dst_bytes; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1031 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1032 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1033
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1034
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1035 /* Store multibyte form of the character C in P, and advance P to the
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1036 end of the multibyte form. This is like CHAR_STRING_ADVANCE but it
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1037 never calls MAYBE_UNIFY_CHAR. */
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1038
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1039 #define CHAR_STRING_ADVANCE_NO_UNIFY(c, p) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1040 do { \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1041 if ((c) <= MAX_1_BYTE_CHAR) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1042 *(p)++ = (c); \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1043 else if ((c) <= MAX_2_BYTE_CHAR) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1044 *(p)++ = (0xC0 | ((c) >> 6)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1045 *(p)++ = (0x80 | ((c) & 0x3F)); \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1046 else if ((c) <= MAX_3_BYTE_CHAR) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1047 *(p)++ = (0xE0 | ((c) >> 12)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1048 *(p)++ = (0x80 | (((c) >> 6) & 0x3F)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1049 *(p)++ = (0x80 | ((c) & 0x3F)); \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1050 else if ((c) <= MAX_4_BYTE_CHAR) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1051 *(p)++ = (0xF0 | (c >> 18)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1052 *(p)++ = (0x80 | ((c >> 12) & 0x3F)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1053 *(p)++ = (0x80 | ((c >> 6) & 0x3F)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1054 *(p)++ = (0x80 | (c & 0x3F)); \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1055 else if ((c) <= MAX_5_BYTE_CHAR) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1056 *(p)++ = 0xF8, \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1057 *(p)++ = (0x80 | ((c >> 18) & 0x0F)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1058 *(p)++ = (0x80 | ((c >> 12) & 0x3F)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1059 *(p)++ = (0x80 | ((c >> 6) & 0x3F)), \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1060 *(p)++ = (0x80 | (c & 0x3F)); \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1061 else \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1062 (p) += BYTE8_STRING ((c) - 0x3FFF80, p); \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1063 } while (0)
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1064
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1065
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1066 /* Return the character code of character whose multibyte form is at
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1067 P, and advance P to the end of the multibyte form. This is like
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1068 STRING_CHAR_ADVANCE, but it never calls MAYBE_UNIFY_CHAR. */
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1069
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1070 #define STRING_CHAR_ADVANCE_NO_UNIFY(p) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1071 (!((p)[0] & 0x80) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1072 ? *(p)++ \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1073 : ! ((p)[0] & 0x20) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1074 ? ((p) += 2, \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1075 ((((p)[-2] & 0x1F) << 6) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1076 | ((p)[-1] & 0x3F) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1077 | ((unsigned char) ((p)[-2]) < 0xC2 ? 0x3FFF80 : 0))) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1078 : ! ((p)[0] & 0x10) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1079 ? ((p) += 3, \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1080 ((((p)[-3] & 0x0F) << 12) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1081 | (((p)[-2] & 0x3F) << 6) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1082 | ((p)[-1] & 0x3F))) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1083 : ! ((p)[0] & 0x08) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1084 ? ((p) += 4, \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1085 ((((p)[-4] & 0xF) << 18) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1086 | (((p)[-3] & 0x3F) << 12) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1087 | (((p)[-2] & 0x3F) << 6) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1088 | ((p)[-1] & 0x3F))) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1089 : ((p) += 5, \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1090 ((((p)[-4] & 0x3F) << 18) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1091 | (((p)[-3] & 0x3F) << 12) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1092 | (((p)[-2] & 0x3F) << 6) \
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1093 | ((p)[-1] & 0x3F))))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1094
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1095
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1096 static void
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1097 coding_set_source (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1098 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1099 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1100 if (BUFFERP (coding->src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1101 {
89418
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
1102 struct buffer *buf = XBUFFER (coding->src_object);
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
1103
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1104 if (coding->src_pos < 0)
89418
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
1105 coding->source = BUF_GAP_END_ADDR (buf) + coding->src_pos_byte;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1106 else
89418
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
1107 coding->source = BUF_BYTE_ADDRESS (buf, coding->src_pos_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1108 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1109 else if (STRINGP (coding->src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1110 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1111 coding->source = SDATA (coding->src_object) + coding->src_pos_byte;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1112 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1113 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1114 /* Otherwise, the source is C string and is never relocated
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1115 automatically. Thus we don't have to update anything. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1116 ;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1117 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1118
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1119 static void
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1120 coding_set_destination (coding)
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1121 struct coding_system *coding;
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1122 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1123 if (BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1124 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1125 if (coding->src_pos < 0)
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1126 {
91807
507bcfb4342c * coding.c (coding_set_destination): Use BEG_BYTE rather than hardcoding 1.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 91622
diff changeset
1127 coding->destination = BEG_ADDR + coding->dst_pos_byte - BEG_BYTE;
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1128 coding->dst_bytes = (GAP_END_ADDR
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1129 - (coding->src_bytes - coding->consumed)
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1130 - coding->destination);
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1131 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1132 else
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1133 {
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1134 /* We are sure that coding->dst_pos_byte is before the gap
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1135 of the buffer. */
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1136 coding->destination = (BUF_BEG_ADDR (XBUFFER (coding->dst_object))
91807
507bcfb4342c * coding.c (coding_set_destination): Use BEG_BYTE rather than hardcoding 1.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 91622
diff changeset
1137 + coding->dst_pos_byte - BEG_BYTE);
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1138 coding->dst_bytes = (BUF_GAP_END_ADDR (XBUFFER (coding->dst_object))
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1139 - coding->destination);
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1140 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1141 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1142 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1143 /* Otherwise, the destination is C string and is never relocated
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1144 automatically. Thus we don't have to update anything. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1145 ;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1146 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1147
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1148
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1149 static void
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1150 coding_alloc_by_realloc (coding, bytes)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1151 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1152 EMACS_INT bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1153 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1154 coding->destination = (unsigned char *) xrealloc (coding->destination,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1155 coding->dst_bytes + bytes);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1156 coding->dst_bytes += bytes;
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1157 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1158
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1159 static void
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1160 coding_alloc_by_making_gap (coding, gap_head_used, bytes)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1161 struct coding_system *coding;
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1162 EMACS_INT gap_head_used, bytes;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1163 {
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1164 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1165 {
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1166 /* The gap may contain the produced data at the head and not-yet
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1167 consumed data at the tail. To preserve those data, we at
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1168 first make the gap size to zero, then increase the gap
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1169 size. */
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1170 EMACS_INT add = GAP_SIZE;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1171
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1172 GPT += gap_head_used, GPT_BYTE += gap_head_used;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1173 GAP_SIZE = 0; ZV += add; Z += add; ZV_BYTE += add; Z_BYTE += add;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1174 make_gap (bytes);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1175 GAP_SIZE += add; ZV -= add; Z -= add; ZV_BYTE -= add; Z_BYTE -= add;
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1176 GPT -= gap_head_used, GPT_BYTE -= gap_head_used;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1177 }
90292
697c08d95af7 Cancel incorrect synching with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90291
diff changeset
1178 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1179 {
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
1180 Lisp_Object this_buffer;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
1181
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
1182 this_buffer = Fcurrent_buffer ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1183 set_buffer_internal (XBUFFER (coding->dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1184 make_gap (bytes);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1185 set_buffer_internal (XBUFFER (this_buffer));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1186 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1187 }
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1188
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1189
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1190 static unsigned char *
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1191 alloc_destination (coding, nbytes, dst)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1192 struct coding_system *coding;
89545
4f394eed6ff2 (inhibit_pre_post_conversion): Removed (unused).
Dave Love <fx@gnu.org>
parents: 89519
diff changeset
1193 EMACS_INT nbytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1194 unsigned char *dst;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1195 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1196 EMACS_INT offset = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1197
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1198 if (BUFFERP (coding->dst_object))
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1199 {
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1200 struct buffer *buf = XBUFFER (coding->dst_object);
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1201
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1202 coding_alloc_by_making_gap (coding, dst - BUF_GPT_ADDR (buf), nbytes);
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1203 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1204 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1205 coding_alloc_by_realloc (coding, nbytes);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1206 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1207 coding_set_destination (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1208 dst = coding->destination + offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1209 return dst;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1210 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1211
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1212 /** Macros for annotations. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1213
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1214 /* An annotation data is stored in the array coding->charbuf in this
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1215 format:
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1216 [ -LENGTH ANNOTATION_MASK NCHARS ... ]
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1217 LENGTH is the number of elements in the annotation.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1218 ANNOTATION_MASK is one of CODING_ANNOTATE_XXX_MASK.
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1219 NCHARS is the number of characters in the text annotated.
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1220
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1221 The format of the following elements depend on ANNOTATION_MASK.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1222
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1223 In the case of CODING_ANNOTATE_COMPOSITION_MASK, these elements
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1224 follows:
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1225 ... NBYTES METHOD [ COMPOSITION-COMPONENTS ... ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1226
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1227 NBYTES is the number of bytes specified in the header part of
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1228 old-style emacs-mule encoding, or 0 for the other kind of
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1229 composition.
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1230
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1231 METHOD is one of enum composition_method.
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1232
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1233 Optionnal COMPOSITION-COMPONENTS are characters and composition
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1234 rules.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1235
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1236 In the case of CODING_ANNOTATE_CHARSET_MASK, one element CHARSET-ID
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1237 follows.
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1238
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1239 If ANNOTATION_MASK is 0, this annotation is just a space holder to
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1240 recover from an invalid annotation, and should be skipped by
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1241 produce_annotation. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1242
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1243 /* Maximum length of the header of annotation data. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1244 #define MAX_ANNOTATION_LENGTH 5
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1245
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1246 #define ADD_ANNOTATION_DATA(buf, len, mask, nchars) \
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1247 do { \
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1248 *(buf)++ = -(len); \
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1249 *(buf)++ = (mask); \
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1250 *(buf)++ = (nchars); \
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1251 coding->annotated = 1; \
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1252 } while (0);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1253
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1254 #define ADD_COMPOSITION_DATA(buf, nchars, nbytes, method) \
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1255 do { \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1256 ADD_ANNOTATION_DATA (buf, 5, CODING_ANNOTATE_COMPOSITION_MASK, nchars); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1257 *buf++ = nbytes; \
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1258 *buf++ = method; \
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1259 } while (0)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1260
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1261
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1262 #define ADD_CHARSET_DATA(buf, nchars, id) \
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1263 do { \
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1264 ADD_ANNOTATION_DATA (buf, 4, CODING_ANNOTATE_CHARSET_MASK, nchars); \
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1265 *buf++ = id; \
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1266 } while (0)
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1267
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1268
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1269 /*** 2. Emacs' internal format (emacs-utf-8) ***/
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1270
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1271
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
1272
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1273
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1274 /*** 3. UTF-8 ***/
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1275
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1276 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1277 Check if a text is encoded in UTF-8. If it is, return 1, else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1278 return 0. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1279
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1280 #define UTF_8_1_OCTET_P(c) ((c) < 0x80)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1281 #define UTF_8_EXTRA_OCTET_P(c) (((c) & 0xC0) == 0x80)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1282 #define UTF_8_2_OCTET_LEADING_P(c) (((c) & 0xE0) == 0xC0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1283 #define UTF_8_3_OCTET_LEADING_P(c) (((c) & 0xF0) == 0xE0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1284 #define UTF_8_4_OCTET_LEADING_P(c) (((c) & 0xF8) == 0xF0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1285 #define UTF_8_5_OCTET_LEADING_P(c) (((c) & 0xFC) == 0xF8)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1286
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1287 #define UTF_BOM 0xFEFF
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1288 #define UTF_8_BOM_1 0xEF
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1289 #define UTF_8_BOM_2 0xBB
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1290 #define UTF_8_BOM_3 0xBF
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1291
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1292 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1293 detect_coding_utf_8 (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1294 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1295 struct coding_detection_info *detect_info;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1296 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1297 const unsigned char *src = coding->source, *src_base;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1298 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1299 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1300 int consumed_chars = 0;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1301 int bom_found = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1302 int found = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1303
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1304 detect_info->checked |= CATEGORY_MASK_UTF_8;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1305 /* A coding system of this category is always ASCII compatible. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1306 src += coding->head_ascii;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1307
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1308 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1309 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1310 int c, c1, c2, c3, c4;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1311
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1312 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1313 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1314 if (c < 0 || UTF_8_1_OCTET_P (c))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1315 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1316 ONE_MORE_BYTE (c1);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1317 if (c1 < 0 || ! UTF_8_EXTRA_OCTET_P (c1))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1318 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1319 if (UTF_8_2_OCTET_LEADING_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1320 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1321 found = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1322 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1323 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1324 ONE_MORE_BYTE (c2);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1325 if (c2 < 0 || ! UTF_8_EXTRA_OCTET_P (c2))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1326 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1327 if (UTF_8_3_OCTET_LEADING_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1328 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1329 found = 1;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1330 if (src_base == coding->source
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1331 && c == UTF_8_BOM_1 && c1 == UTF_8_BOM_2 && c2 == UTF_8_BOM_3)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1332 bom_found = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1333 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1334 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1335 ONE_MORE_BYTE (c3);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1336 if (c3 < 0 || ! UTF_8_EXTRA_OCTET_P (c3))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1337 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1338 if (UTF_8_4_OCTET_LEADING_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1339 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1340 found = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1341 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1342 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1343 ONE_MORE_BYTE (c4);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1344 if (c4 < 0 || ! UTF_8_EXTRA_OCTET_P (c4))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1345 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1346 if (UTF_8_5_OCTET_LEADING_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1347 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1348 found = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1349 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1350 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1351 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1352 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1353 detect_info->rejected |= CATEGORY_MASK_UTF_8;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1354 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1355
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1356 no_more_source:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1357 if (src_base < src && coding->mode & CODING_MODE_LAST_BLOCK)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
1358 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1359 detect_info->rejected |= CATEGORY_MASK_UTF_8;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
1360 return 0;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
1361 }
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1362 if (bom_found)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1363 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1364 /* The first character 0xFFFE doesn't necessarily mean a BOM. */
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1365 detect_info->found |= CATEGORY_MASK_UTF_8_SIG | CATEGORY_MASK_UTF_8_NOSIG;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1366 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1367 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1368 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1369 detect_info->rejected |= CATEGORY_MASK_UTF_8_SIG;
96571
a3f2a5a4b492 (detect_coding_utf_8): Set detect_info->found only when
Kenichi Handa <handa@m17n.org>
parents: 95585
diff changeset
1370 if (found)
a3f2a5a4b492 (detect_coding_utf_8): Set detect_info->found only when
Kenichi Handa <handa@m17n.org>
parents: 95585
diff changeset
1371 detect_info->found |= CATEGORY_MASK_UTF_8_NOSIG;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1372 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1373 return 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1374 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1375
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1376
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1377 static void
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1378 decode_coding_utf_8 (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1379 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1380 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1381 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1382 const unsigned char *src_end = coding->source + coding->src_bytes;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1383 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1384 int *charbuf = coding->charbuf + coding->charbuf_used;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1385 int *charbuf_end = coding->charbuf + coding->charbuf_size;
100133
bca35d7cb3ac (decode_coding_utf_8): Likewise.
Kenichi Handa <handa@m17n.org>
parents: 100131
diff changeset
1386 int consumed_chars = 0, consumed_chars_base = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1387 int multibytep = coding->src_multibyte;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1388 enum utf_bom_type bom = CODING_UTF_8_BOM (coding);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1389 Lisp_Object attr, charset_list;
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
1390 int eol_crlf =
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
1391 !inhibit_eol_conversion && EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1392 int byte_after_cr = -1;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1393
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1394 CODING_GET_INFO (coding, attr, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1395
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1396 if (bom != utf_without_bom)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1397 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1398 int c1, c2, c3;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1399
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1400 src_base = src;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1401 ONE_MORE_BYTE (c1);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1402 if (! UTF_8_3_OCTET_LEADING_P (c1))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1403 src = src_base;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1404 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1405 {
99074
10cd979d05ca (make_conversion_work_buffer): Check that Vcode_conversion_reused_workbuf
Noah Friedman <friedman@splode.com>
parents: 98992
diff changeset
1406 ONE_MORE_BYTE (c2);
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1407 if (! UTF_8_EXTRA_OCTET_P (c2))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1408 src = src_base;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1409 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1410 {
99074
10cd979d05ca (make_conversion_work_buffer): Check that Vcode_conversion_reused_workbuf
Noah Friedman <friedman@splode.com>
parents: 98992
diff changeset
1411 ONE_MORE_BYTE (c3);
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1412 if (! UTF_8_EXTRA_OCTET_P (c3))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1413 src = src_base;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1414 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1415 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1416 if ((c1 != UTF_8_BOM_1)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1417 || (c2 != UTF_8_BOM_2) || (c3 != UTF_8_BOM_3))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1418 src = src_base;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1419 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1420 CODING_UTF_8_BOM (coding) = utf_without_bom;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1421 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1422 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1423 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1424 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1425 CODING_UTF_8_BOM (coding) = utf_without_bom;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1426
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1427
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1428
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1429 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1430 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1431 int c, c1, c2, c3, c4, c5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1432
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1433 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1434 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1435
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1436 if (charbuf >= charbuf_end)
100936
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
1437 {
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
1438 if (byte_after_cr >= 0)
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
1439 src_base--;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
1440 break;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
1441 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1442
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1443 if (byte_after_cr >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1444 c1 = byte_after_cr, byte_after_cr = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1445 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1446 ONE_MORE_BYTE (c1);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1447 if (c1 < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1448 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1449 c = - c1;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1450 }
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1451 else if (UTF_8_1_OCTET_P(c1))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1452 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1453 if (eol_crlf && c1 == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1454 ONE_MORE_BYTE (byte_after_cr);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1455 c = c1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1456 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1457 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1458 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1459 ONE_MORE_BYTE (c2);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1460 if (c2 < 0 || ! UTF_8_EXTRA_OCTET_P (c2))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1461 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1462 if (UTF_8_2_OCTET_LEADING_P (c1))
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1463 {
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1464 c = ((c1 & 0x1F) << 6) | (c2 & 0x3F);
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1465 /* Reject overlong sequences here and below. Encoders
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1466 producing them are incorrect, they can be misleading,
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1467 and they mess up read/write invariance. */
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1468 if (c < 128)
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1469 goto invalid_code;
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1470 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1471 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1472 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1473 ONE_MORE_BYTE (c3);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1474 if (c3 < 0 || ! UTF_8_EXTRA_OCTET_P (c3))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1475 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1476 if (UTF_8_3_OCTET_LEADING_P (c1))
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1477 {
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1478 c = (((c1 & 0xF) << 12)
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1479 | ((c2 & 0x3F) << 6) | (c3 & 0x3F));
89184
88a9e962e183 (decode_coding_utf_8): Treat surrogates as invalid.
Dave Love <fx@gnu.org>
parents: 89042
diff changeset
1480 if (c < 0x800
88a9e962e183 (decode_coding_utf_8): Treat surrogates as invalid.
Dave Love <fx@gnu.org>
parents: 89042
diff changeset
1481 || (c >= 0xd800 && c < 0xe000)) /* surrogates (invalid) */
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1482 goto invalid_code;
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1483 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1484 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1485 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1486 ONE_MORE_BYTE (c4);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1487 if (c4 < 0 || ! UTF_8_EXTRA_OCTET_P (c4))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1488 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1489 if (UTF_8_4_OCTET_LEADING_P (c1))
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1490 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1491 c = (((c1 & 0x7) << 18) | ((c2 & 0x3F) << 12)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1492 | ((c3 & 0x3F) << 6) | (c4 & 0x3F));
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1493 if (c < 0x10000)
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1494 goto invalid_code;
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1495 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1496 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1497 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1498 ONE_MORE_BYTE (c5);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1499 if (c5 < 0 || ! UTF_8_EXTRA_OCTET_P (c5))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1500 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1501 if (UTF_8_5_OCTET_LEADING_P (c1))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1502 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1503 c = (((c1 & 0x3) << 24) | ((c2 & 0x3F) << 18)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1504 | ((c3 & 0x3F) << 12) | ((c4 & 0x3F) << 6)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1505 | (c5 & 0x3F));
88669
0bc5868f9f61 (decode_coding_utf_8): Reject overlong sequences.
Dave Love <fx@gnu.org>
parents: 88646
diff changeset
1506 if ((c > MAX_CHAR) || (c < 0x200000))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1507 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1508 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1509 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1510 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1511 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1512 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1513 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1514 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1515
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1516 *charbuf++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1517 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1518
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1519 invalid_code:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1520 src = src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1521 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1522 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1523 *charbuf++ = ASCII_BYTE_P (c) ? c : BYTE8_TO_CHAR (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1524 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1525 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1526
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1527 no_more_source:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1528 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1529 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1530 coding->charbuf_used = charbuf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1531 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1532
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1533
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1534 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1535 encode_coding_utf_8 (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1536 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1537 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1538 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1539 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1540 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1541 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1542 unsigned char *dst_end = coding->destination + coding->dst_bytes;
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
1543 int produced_chars = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1544 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1545
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1546 if (CODING_UTF_8_BOM (coding) == utf_with_bom)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1547 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1548 ASSURE_DESTINATION (3);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1549 EMIT_THREE_BYTES (UTF_8_BOM_1, UTF_8_BOM_2, UTF_8_BOM_3);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1550 CODING_UTF_8_BOM (coding) = utf_without_bom;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1551 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1552
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1553 if (multibytep)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1554 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1555 int safe_room = MAX_MULTIBYTE_LENGTH * 2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1556
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1557 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1558 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1559 unsigned char str[MAX_MULTIBYTE_LENGTH], *p, *pend = str;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1560
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1561 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1562 c = *charbuf++;
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1563 if (CHAR_BYTE8_P (c))
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1564 {
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1565 c = CHAR_TO_BYTE8 (c);
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1566 EMIT_ONE_BYTE (c);
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1567 }
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1568 else
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1569 {
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1570 CHAR_STRING_ADVANCE_NO_UNIFY (c, pend);
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1571 for (p = str; p < pend; p++)
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1572 EMIT_ONE_BYTE (*p);
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
1573 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1574 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1575 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1576 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1577 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1578 int safe_room = MAX_MULTIBYTE_LENGTH;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1579
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1580 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1581 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1582 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1583 c = *charbuf++;
89917
1763eef5ad02 (encode_coding_utf_8): Fix handling of raw-byte char.
Kenichi Handa <handa@m17n.org>
parents: 89905
diff changeset
1584 if (CHAR_BYTE8_P (c))
1763eef5ad02 (encode_coding_utf_8): Fix handling of raw-byte char.
Kenichi Handa <handa@m17n.org>
parents: 89905
diff changeset
1585 *dst++ = CHAR_TO_BYTE8 (c);
1763eef5ad02 (encode_coding_utf_8): Fix handling of raw-byte char.
Kenichi Handa <handa@m17n.org>
parents: 89905
diff changeset
1586 else
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
1587 CHAR_STRING_ADVANCE_NO_UNIFY (c, dst);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1588 produced_chars++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1589 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1590 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1591 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1592 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1593 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1594 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1595 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1596
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1597
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1598 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1599 Check if a text is encoded in one of UTF-16 based coding systems.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1600 If it is, return 1, else return 0. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1601
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1602 #define UTF_16_HIGH_SURROGATE_P(val) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1603 (((val) & 0xFC00) == 0xD800)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1604
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1605 #define UTF_16_LOW_SURROGATE_P(val) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1606 (((val) & 0xFC00) == 0xDC00)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1607
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1608 #define UTF_16_INVALID_P(val) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1609 (((val) == 0xFFFE) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1610 || ((val) == 0xFFFF) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1611 || UTF_16_LOW_SURROGATE_P (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1612
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1613
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1614 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1615 detect_coding_utf_16 (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1616 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1617 struct coding_detection_info *detect_info;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1618 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1619 const unsigned char *src = coding->source, *src_base = src;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1620 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1621 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1622 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1623 int c1, c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1624
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1625 detect_info->checked |= CATEGORY_MASK_UTF_16;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1626 if (coding->mode & CODING_MODE_LAST_BLOCK
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1627 && (coding->src_chars & 1))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1628 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1629 detect_info->rejected |= CATEGORY_MASK_UTF_16;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1630 return 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1631 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1632
101172
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
1633 TWO_MORE_BYTES (c1, c2);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1634 if ((c1 == 0xFF) && (c2 == 0xFE))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1635 {
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1636 detect_info->found |= (CATEGORY_MASK_UTF_16_LE
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1637 | CATEGORY_MASK_UTF_16_AUTO);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1638 detect_info->rejected |= (CATEGORY_MASK_UTF_16_BE
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1639 | CATEGORY_MASK_UTF_16_BE_NOSIG
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1640 | CATEGORY_MASK_UTF_16_LE_NOSIG);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1641 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1642 else if ((c1 == 0xFE) && (c2 == 0xFF))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1643 {
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1644 detect_info->found |= (CATEGORY_MASK_UTF_16_BE
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1645 | CATEGORY_MASK_UTF_16_AUTO);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1646 detect_info->rejected |= (CATEGORY_MASK_UTF_16_LE
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1647 | CATEGORY_MASK_UTF_16_BE_NOSIG
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1648 | CATEGORY_MASK_UTF_16_LE_NOSIG);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1649 }
101174
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
1650 else if (c2 < 0)
101172
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
1651 {
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
1652 detect_info->rejected |= CATEGORY_MASK_UTF_16;
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
1653 return 0;
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
1654 }
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1655 else
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1656 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1657 /* We check the dispersion of Eth and Oth bytes where E is even and
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1658 O is odd. If both are high, we assume binary data.*/
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1659 unsigned char e[256], o[256];
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1660 unsigned e_num = 1, o_num = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1661
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1662 memset (e, 0, 256);
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1663 memset (o, 0, 256);
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1664 e[c1] = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1665 o[c2] = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1666
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1667 detect_info->rejected
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1668 |= (CATEGORY_MASK_UTF_16_BE | CATEGORY_MASK_UTF_16_LE);
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1669
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1670 while (1)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1671 {
101172
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
1672 TWO_MORE_BYTES (c1, c2);
101174
198d8bf06a4f Fix previous changes.
Kenichi Handa <handa@m17n.org>
parents: 101172
diff changeset
1673 if (c2 < 0)
101172
674e67257137 (TWO_MORE_BYTES): New macro.
Kenichi Handa <handa@m17n.org>
parents: 101040
diff changeset
1674 break;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1675 if (! e[c1])
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1676 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1677 e[c1] = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1678 e_num++;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1679 if (e_num >= 128)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1680 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1681 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1682 if (! o[c2])
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1683 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1684 o[c1] = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1685 o_num++;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1686 if (o_num >= 128)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1687 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1688 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1689 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1690 detect_info->rejected |= CATEGORY_MASK_UTF_16;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1691 return 0;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1692 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
1693
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
1694 no_more_source:
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
1695 return 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1696 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1697
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1698 static void
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1699 decode_coding_utf_16 (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1700 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1701 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1702 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1703 const unsigned char *src_end = coding->source + coding->src_bytes;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1704 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
1705 int *charbuf = coding->charbuf + coding->charbuf_used;
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
1706 /* We may produces at most 3 chars in one loop. */
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
1707 int *charbuf_end = coding->charbuf + coding->charbuf_size - 2;
100131
0e4115b39b5d (decode_coding_utf_16): Initialize consumed_chars_base
Kenichi Handa <handa@m17n.org>
parents: 99753
diff changeset
1708 int consumed_chars = 0, consumed_chars_base = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1709 int multibytep = coding->src_multibyte;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1710 enum utf_bom_type bom = CODING_UTF_16_BOM (coding);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1711 enum utf_16_endian_type endian = CODING_UTF_16_ENDIAN (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1712 int surrogate = CODING_UTF_16_SURROGATE (coding);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1713 Lisp_Object attr, charset_list;
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
1714 int eol_crlf =
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
1715 !inhibit_eol_conversion && EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1716 int byte_after_cr1 = -1, byte_after_cr2 = -1;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1717
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1718 CODING_GET_INFO (coding, attr, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1719
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1720 if (bom == utf_with_bom)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1721 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1722 int c, c1, c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1723
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1724 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1725 ONE_MORE_BYTE (c1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1726 ONE_MORE_BYTE (c2);
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
1727 c = (c1 << 8) | c2;
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1728
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1729 if (endian == utf_16_big_endian
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1730 ? c != 0xFEFF : c != 0xFFFE)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1731 {
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1732 /* The first two bytes are not BOM. Treat them as bytes
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1733 for a normal character. */
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1734 src = src_base;
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1735 coding->errors++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1736 }
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1737 CODING_UTF_16_BOM (coding) = utf_without_bom;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1738 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1739 else if (bom == utf_detect_bom)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1740 {
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1741 /* We have already tried to detect BOM and failed in
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
1742 detect_coding. */
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1743 CODING_UTF_16_BOM (coding) = utf_without_bom;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1744 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1745
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1746 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1747 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1748 int c, c1, c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1749
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1750 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1751 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1752
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
1753 if (charbuf >= charbuf_end)
100936
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
1754 {
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
1755 if (byte_after_cr1 >= 0)
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
1756 src_base -= 2;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
1757 break;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
1758 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1759
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1760 if (byte_after_cr1 >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1761 c1 = byte_after_cr1, byte_after_cr1 = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1762 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1763 ONE_MORE_BYTE (c1);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1764 if (c1 < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1765 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1766 *charbuf++ = -c1;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1767 continue;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1768 }
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1769 if (byte_after_cr2 >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1770 c2 = byte_after_cr2, byte_after_cr2 = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1771 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1772 ONE_MORE_BYTE (c2);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1773 if (c2 < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1774 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1775 *charbuf++ = ASCII_BYTE_P (c1) ? c1 : BYTE8_TO_CHAR (c1);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1776 *charbuf++ = -c2;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1777 continue;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1778 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1779 c = (endian == utf_16_big_endian
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
1780 ? ((c1 << 8) | c2) : ((c2 << 8) | c1));
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1781
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1782 if (surrogate)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1783 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1784 if (! UTF_16_LOW_SURROGATE_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1785 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1786 if (endian == utf_16_big_endian)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1787 c1 = surrogate >> 8, c2 = surrogate & 0xFF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1788 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1789 c1 = surrogate & 0xFF, c2 = surrogate >> 8;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1790 *charbuf++ = c1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1791 *charbuf++ = c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1792 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1793 if (UTF_16_HIGH_SURROGATE_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1794 CODING_UTF_16_SURROGATE (coding) = surrogate = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1795 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1796 *charbuf++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1797 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1798 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1799 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1800 c = ((surrogate - 0xD800) << 10) | (c - 0xDC00);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1801 CODING_UTF_16_SURROGATE (coding) = surrogate = 0;
89842
b5f22f538c1f (decode_coding_utf_16): Fix handling of surrogate pare.
Kenichi Handa <handa@m17n.org>
parents: 89780
diff changeset
1802 *charbuf++ = 0x10000 + c;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1803 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1804 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1805 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1806 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1807 if (UTF_16_HIGH_SURROGATE_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1808 CODING_UTF_16_SURROGATE (coding) = surrogate = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1809 else
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1810 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1811 if (eol_crlf && c == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1812 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1813 ONE_MORE_BYTE (byte_after_cr1);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1814 ONE_MORE_BYTE (byte_after_cr2);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1815 }
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1816 *charbuf++ = c;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
1817 }
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
1818 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1819 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1820
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1821 no_more_source:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1822 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1823 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1824 coding->charbuf_used = charbuf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1825 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1826
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1827 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1828 encode_coding_utf_16 (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1829 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1830 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1831 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1832 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1833 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1834 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1835 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1836 int safe_room = 8;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1837 enum utf_bom_type bom = CODING_UTF_16_BOM (coding);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1838 int big_endian = CODING_UTF_16_ENDIAN (coding) == utf_16_big_endian;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1839 int produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1840 Lisp_Object attrs, charset_list;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1841 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1842
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
1843 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1844
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1845 if (bom != utf_without_bom)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1846 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1847 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1848 if (big_endian)
89404
3e1d187b52c3 (Qutf_16_be_nosig, Qutf_16_be, Qutf_16_le_nosig)
Kenichi Handa <handa@m17n.org>
parents: 89394
diff changeset
1849 EMIT_TWO_BYTES (0xFE, 0xFF);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1850 else
89404
3e1d187b52c3 (Qutf_16_be_nosig, Qutf_16_be, Qutf_16_le_nosig)
Kenichi Handa <handa@m17n.org>
parents: 89394
diff changeset
1851 EMIT_TWO_BYTES (0xFF, 0xFE);
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
1852 CODING_UTF_16_BOM (coding) = utf_without_bom;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1853 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1854
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1855 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1856 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1857 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1858 c = *charbuf++;
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
1859 if (c >= MAX_UNICODE_CHAR)
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
1860 c = coding->default_char;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1861
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1862 if (c < 0x10000)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1863 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1864 if (big_endian)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1865 EMIT_TWO_BYTES (c >> 8, c & 0xFF);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1866 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1867 EMIT_TWO_BYTES (c & 0xFF, c >> 8);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1868 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1869 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1870 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1871 int c1, c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1872
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1873 c -= 0x10000;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1874 c1 = (c >> 10) + 0xD800;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1875 c2 = (c & 0x3FF) + 0xDC00;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1876 if (big_endian)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1877 EMIT_FOUR_BYTES (c1 >> 8, c1 & 0xFF, c2 >> 8, c2 & 0xFF);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1878 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1879 EMIT_FOUR_BYTES (c1 & 0xFF, c1 >> 8, c2 & 0xFF, c2 >> 8);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1880 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1881 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
1882 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1883 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1884 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1885 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1886 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1887
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1888
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1889 /*** 6. Old Emacs' internal format (emacs-mule) ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1890
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1891 /* Emacs' internal format for representation of multiple character
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1892 sets is a kind of multi-byte encoding, i.e. characters are
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1893 represented by variable-length sequences of one-byte codes.
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1894
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1895 ASCII characters and control characters (e.g. `tab', `newline') are
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1896 represented by one-byte sequences which are their ASCII codes, in
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1897 the range 0x00 through 0x7F.
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1898
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1899 8-bit characters of the range 0x80..0x9F are represented by
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1900 two-byte sequences of LEADING_CODE_8_BIT_CONTROL and (their 8-bit
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1901 code + 0x20).
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1902
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1903 8-bit characters of the range 0xA0..0xFF are represented by
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1904 one-byte sequences which are their 8-bit code.
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1905
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1906 The other characters are represented by a sequence of `base
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1907 leading-code', optional `extended leading-code', and one or two
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1908 `position-code's. The length of the sequence is determined by the
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1909 base leading-code. Leading-code takes the range 0x81 through 0x9D,
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1910 whereas extended leading-code and position-code take the range 0xA0
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1911 through 0xFF. See `charset.h' for more details about leading-code
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1912 and position-code.
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
1913
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1914 --- CODE RANGE of Emacs' internal format ---
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1915 character set range
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1916 ------------- -----
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1917 ascii 0x00..0x7F
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1918 eight-bit-control LEADING_CODE_8_BIT_CONTROL + 0xA0..0xBF
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
1919 eight-bit-graphic 0xA0..0xBF
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1920 ELSE 0x81..0x9D + [0xA0..0xFF]+
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1921 ---------------------------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1922
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1923 As this is the internal character representation, the format is
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1924 usually not used externally (i.e. in a file or in a data sent to a
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1925 process). But, it is possible to have a text externally in this
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1926 format (i.e. by encoding by the coding system `emacs-mule').
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1927
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1928 In that case, a sequence of one-byte codes has a slightly different
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1929 form.
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1930
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1931 At first, all characters in eight-bit-control are represented by
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1932 one-byte sequences which are their 8-bit code.
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1933
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1934 Next, character composition data are represented by the byte
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1935 sequence of the form: 0x80 METHOD BYTES CHARS COMPONENT ...,
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1936 where,
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1937 METHOD is 0xF2 plus one of composition method (enum
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1938 composition_method),
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1939
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1940 BYTES is 0xA0 plus a byte length of this composition data,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1941
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1942 CHARS is 0xA0 plus a number of characters composed by this
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1943 data,
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1944
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1945 COMPONENTs are characters of multibye form or composition
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1946 rules encoded by two-byte of ASCII codes.
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1947
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1948 In addition, for backward compatibility, the following formats are
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1949 also recognized as composition data on decoding.
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1950
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1951 0x80 MSEQ ...
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1952 0x80 0xFF MSEQ RULE MSEQ RULE ... MSEQ
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1953
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1954 Here,
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1955 MSEQ is a multibyte form but in these special format:
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1956 ASCII: 0xA0 ASCII_CODE+0x80,
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1957 other: LEADING_CODE+0x20 FOLLOWING-BYTE ...,
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1958 RULE is a one byte code of the range 0xA0..0xF0 that
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
1959 represents a composition rule.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1960 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
1961
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1962 char emacs_mule_bytes[256];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
1963
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1964
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1965 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1966 Check if a text is encoded in `emacs-mule'. If it is, return 1,
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1967 else return 0. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1968
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1969 static int
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1970 detect_coding_emacs_mule (coding, detect_info)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1971 struct coding_system *coding;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1972 struct coding_detection_info *detect_info;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1973 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1974 const unsigned char *src = coding->source, *src_base;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1975 const unsigned char *src_end = coding->source + coding->src_bytes;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1976 int multibytep = coding->src_multibyte;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1977 int consumed_chars = 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1978 int c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1979 int found = 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1980
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1981 detect_info->checked |= CATEGORY_MASK_EMACS_MULE;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1982 /* A coding system of this category is always ASCII compatible. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1983 src += coding->head_ascii;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1984
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1985 while (1)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1986 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1987 src_base = src;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1988 ONE_MORE_BYTE (c);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1989 if (c < 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1990 continue;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1991 if (c == 0x80)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1992 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1993 /* Perhaps the start of composite character. We simply skip
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1994 it because analyzing it is too heavy for detecting. But,
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1995 at least, we check that the composite character
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1996 constitutes of more than 4 bytes. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1997 const unsigned char *src_base;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1998
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
1999 repeat:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2000 src_base = src;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2001 do
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2002 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2003 ONE_MORE_BYTE (c);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2004 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2005 while (c >= 0xA0);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2006
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2007 if (src - src_base <= 4)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2008 break;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2009 found = CATEGORY_MASK_EMACS_MULE;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2010 if (c == 0x80)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2011 goto repeat;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2012 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2013
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2014 if (c < 0x80)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2015 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2016 if (c < 0x20
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2017 && (c == ISO_CODE_ESC || c == ISO_CODE_SI || c == ISO_CODE_SO))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2018 break;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2019 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2020 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2021 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2022 int more_bytes = emacs_mule_bytes[*src_base] - 1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2023
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2024 while (more_bytes > 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2025 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2026 ONE_MORE_BYTE (c);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2027 if (c < 0xA0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2028 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2029 src--; /* Unread the last byte. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2030 break;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2031 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2032 more_bytes--;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2033 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2034 if (more_bytes != 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2035 break;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2036 found = CATEGORY_MASK_EMACS_MULE;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2037 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2038 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2039 detect_info->rejected |= CATEGORY_MASK_EMACS_MULE;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2040 return 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2041
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2042 no_more_source:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2043 if (src_base < src && coding->mode & CODING_MODE_LAST_BLOCK)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2044 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2045 detect_info->rejected |= CATEGORY_MASK_EMACS_MULE;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2046 return 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2047 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2048 detect_info->found |= found;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2049 return 1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2050 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2051
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2052
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2053 /* Parse emacs-mule multibyte sequence at SRC and return the decoded
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2054 character. If CMP_STATUS indicates that we must expect MSEQ or
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2055 RULE described above, decode it and return the negative value of
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2056 the deocded character or rule. If an invalid byte is found, return
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2057 -1. If SRC is too short, return -2. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2058
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2059 int
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2060 emacs_mule_char (coding, src, nbytes, nchars, id, cmp_status)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2061 struct coding_system *coding;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2062 const unsigned char *src;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2063 int *nbytes, *nchars, *id;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2064 struct composition_status *cmp_status;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2065 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2066 const unsigned char *src_end = coding->source + coding->src_bytes;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2067 const unsigned char *src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2068 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2069 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2070 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2071 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2072 int consumed_chars = 0;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2073 int mseq_found = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2074
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2075 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2076 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2077 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2078 c = -c;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2079 charset = emacs_mule_charset[0];
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2080 }
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2081 else
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2082 {
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2083 if (c >= 0xA0)
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2084 {
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2085 if (cmp_status->state != COMPOSING_NO
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2086 && cmp_status->old_form)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2087 {
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2088 if (cmp_status->state == COMPOSING_CHAR)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2089 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2090 if (c == 0xA0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2091 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2092 ONE_MORE_BYTE (c);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2093 c -= 0x80;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2094 if (c < 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2095 goto invalid_code;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2096 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2097 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2098 c -= 0x20;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2099 mseq_found = 1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2100 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2101 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2102 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2103 *nbytes = src - src_base;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2104 *nchars = consumed_chars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2105 return -c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2106 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2107 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2108 else
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2109 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2110 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2111
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2112 switch (emacs_mule_bytes[c])
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2113 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2114 case 2:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2115 if (! (charset = emacs_mule_charset[c]))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2116 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2117 ONE_MORE_BYTE (c);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2118 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2119 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2120 code = c & 0x7F;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2121 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2122
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2123 case 3:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2124 if (c == EMACS_MULE_LEADING_CODE_PRIVATE_11
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2125 || c == EMACS_MULE_LEADING_CODE_PRIVATE_12)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2126 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2127 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
2128 if (c < 0xA0 || ! (charset = emacs_mule_charset[c]))
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2129 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2130 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
2131 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2132 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2133 code = c & 0x7F;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2134 }
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2135 else
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2136 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2137 if (! (charset = emacs_mule_charset[c]))
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2138 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2139 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
2140 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2141 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2142 code = (c & 0x7F) << 8;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2143 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
2144 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2145 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2146 code |= c & 0x7F;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2147 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2148 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2149
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2150 case 4:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2151 ONE_MORE_BYTE (c);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2152 if (c < 0 || ! (charset = emacs_mule_charset[c]))
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2153 goto invalid_code;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2154 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
2155 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2156 goto invalid_code;
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2157 code = (c & 0x7F) << 8;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2158 ONE_MORE_BYTE (c);
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
2159 if (c < 0xA0)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2160 goto invalid_code;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2161 code |= c & 0x7F;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2162 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2163
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2164 case 1:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2165 code = c;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2166 charset = CHARSET_FROM_ID (ASCII_BYTE_P (code)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2167 ? charset_ascii : charset_eight_bit);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2168 break;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2169
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2170 default:
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2171 abort ();
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2172 }
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2173 c = DECODE_CHAR (charset, code);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2174 if (c < 0)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2175 goto invalid_code;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2176 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2177 *nbytes = src - src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2178 *nchars = consumed_chars;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2179 if (id)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2180 *id = charset->id;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2181 return (mseq_found ? -c : c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2182
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2183 no_more_source:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2184 return -2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2185
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2186 invalid_code:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2187 return -1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2188 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2189
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2190
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2191 /* See the above "GENERAL NOTES on `decode_coding_XXX ()' functions". */
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2192
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2193 /* Handle these composition sequence ('|': the end of header elements,
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2194 BYTES and CHARS >= 0xA0):
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2195
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2196 (1) relative composition: 0x80 0xF2 BYTES CHARS | CHAR ...
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2197 (2) altchar composition: 0x80 0xF4 BYTES CHARS | ALT ... ALT CHAR ...
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2198 (3) alt&rule composition: 0x80 0xF5 BYTES CHARS | ALT RULE ... ALT CHAR ...
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2199
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2200 and these old form:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2201
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2202 (4) relative composition: 0x80 | MSEQ ... MSEQ
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2203 (5) rulebase composition: 0x80 0xFF | MSEQ MRULE ... MSEQ
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2204
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2205 When the starter 0x80 and the following header elements are found,
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2206 this annotation header is produced.
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2207
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2208 [ -LENGTH(==-5) CODING_ANNOTATE_COMPOSITION_MASK NCHARS NBYTES METHOD ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2209
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2210 NCHARS is CHARS - 0xA0 for (1), (2), (3), and 0 for (4), (5).
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2211 NBYTES is BYTES - 0xA0 for (1), (2), (3), and 0 for (4), (5).
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2212
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2213 Then, upon reading the following elements, these codes are produced
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2214 until the composition end is found:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2215
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2216 (1) CHAR ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2217 (2) ALT ... ALT CHAR ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2218 (3) ALT -2 DECODED-RULE ALT -2 DECODED-RULE ... ALT CHAR ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2219 (4) CHAR ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2220 (5) CHAR -2 DECODED-RULE CHAR -2 DECODED-RULE ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2221
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2222 When the composition end is found, LENGTH and NCHARS in the
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2223 annotation header is updated as below:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2224
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2225 (1) LENGTH: unchanged, NCHARS: unchanged
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2226 (2) LENGTH: length of the whole sequence minus NCHARS, NCHARS: unchanged
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2227 (3) LENGTH: length of the whole sequence minus NCHARS, NCHARS: unchanged
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2228 (4) LENGTH: unchanged, NCHARS: number of CHARs
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2229 (5) LENGTH: unchanged, NCHARS: number of CHARs
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2230
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2231 If an error is found while composing, the annotation header is
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2232 changed to the original composition header (plus filler -1s) as
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2233 below:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2234
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2235 (1),(2),(3) [ 0x80 0xF2+METHOD BYTES CHARS -1 ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2236 (5) [ 0x80 0xFF -1 -1- -1 ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2237
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2238 and the sequence [ -2 DECODED-RULE ] is changed to the original
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2239 byte sequence as below:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2240 o the original byte sequence is B: [ B -1 ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2241 o the original byte sequence is B1 B2: [ B1 B2 ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2242
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2243 Most of the routines are implemented by macros because many
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2244 variables and labels in the caller decode_coding_emacs_mule must be
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2245 accessible, and they are usually called just once (thus doesn't
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2246 increase the size of compiled object). */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2247
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2248 /* Decode a composition rule represented by C as a component of
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2249 composition sequence of Emacs 20 style. Set RULE to the decoded
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2250 rule. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2251
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2252 #define DECODE_EMACS_MULE_COMPOSITION_RULE_20(c, rule) \
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2253 do { \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2254 int gref, nref; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2255 \
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2256 c -= 0xA0; \
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2257 if (c < 0 || c >= 81) \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2258 goto invalid_code; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2259 gref = c / 9, nref = c % 9; \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2260 if (gref == 4) gref = 10; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2261 if (nref == 4) nref = 10; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2262 rule = COMPOSITION_ENCODE_RULE (gref, nref); \
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2263 } while (0)
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2264
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2265
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2266 /* Decode a composition rule represented by C and the following byte
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2267 at SRC as a component of composition sequence of Emacs 21 style.
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2268 Set RULE to the decoded rule. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2269
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2270 #define DECODE_EMACS_MULE_COMPOSITION_RULE_21(c, rule) \
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2271 do { \
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2272 int gref, nref; \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2273 \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2274 gref = c - 0x20; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2275 if (gref < 0 || gref >= 81) \
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2276 goto invalid_code; \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2277 ONE_MORE_BYTE (c); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2278 nref = c - 0x20; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2279 if (nref < 0 || nref >= 81) \
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2280 goto invalid_code; \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2281 rule = COMPOSITION_ENCODE_RULE (gref, nref); \
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2282 } while (0)
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2283
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2284
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2285 /* Start of Emacs 21 style format. The first three bytes at SRC are
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2286 (METHOD - 0xF2), (BYTES - 0xA0), (CHARS - 0xA0), where BYTES is the
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2287 byte length of this composition information, CHARS is the number of
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2288 characters composed by this composition. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2289
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2290 #define DECODE_EMACS_MULE_21_COMPOSITION() \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2291 do { \
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2292 enum composition_method method = c - 0xF2; \
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
2293 int *charbuf_base = charbuf; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2294 int nbytes, nchars; \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2295 \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2296 ONE_MORE_BYTE (c); \
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2297 if (c < 0) \
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2298 goto invalid_code; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2299 nbytes = c - 0xA0; \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2300 if (nbytes < 3 || (method == COMPOSITION_RELATIVE && nbytes != 4)) \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2301 goto invalid_code; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2302 ONE_MORE_BYTE (c); \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2303 nchars = c - 0xA0; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2304 if (nchars <= 0 || nchars >= MAX_COMPOSITION_COMPONENTS) \
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2305 goto invalid_code; \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2306 cmp_status->old_form = 0; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2307 cmp_status->method = method; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2308 if (method == COMPOSITION_RELATIVE) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2309 cmp_status->state = COMPOSING_CHAR; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2310 else \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2311 cmp_status->state = COMPOSING_COMPONENT_CHAR; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2312 cmp_status->length = MAX_ANNOTATION_LENGTH; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2313 cmp_status->nchars = nchars; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2314 cmp_status->ncomps = nbytes - 4; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2315 ADD_COMPOSITION_DATA (charbuf, nchars, nbytes, method); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2316 } while (0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2317
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2318
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2319 /* Start of Emacs 20 style format for relative composition. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2320
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2321 #define DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION() \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2322 do { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2323 cmp_status->old_form = 1; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2324 cmp_status->method = COMPOSITION_RELATIVE; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2325 cmp_status->state = COMPOSING_CHAR; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2326 cmp_status->length = MAX_ANNOTATION_LENGTH; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2327 cmp_status->nchars = cmp_status->ncomps = 0; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2328 ADD_COMPOSITION_DATA (charbuf, 0, 0, cmp_status->method); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2329 } while (0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2330
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2331
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2332 /* Start of Emacs 20 style format for rule-base composition. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2333
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2334 #define DECODE_EMACS_MULE_20_RULEBASE_COMPOSITION() \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2335 do { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2336 cmp_status->old_form = 1; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2337 cmp_status->method = COMPOSITION_WITH_RULE; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2338 cmp_status->state = COMPOSING_CHAR; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2339 cmp_status->length = MAX_ANNOTATION_LENGTH; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2340 cmp_status->nchars = cmp_status->ncomps = 0; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2341 ADD_COMPOSITION_DATA (charbuf, 0, 0, cmp_status->method); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2342 } while (0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2343
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2344
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2345 #define DECODE_EMACS_MULE_COMPOSITION_START() \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2346 do { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2347 const unsigned char *current_src = src; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2348 \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2349 ONE_MORE_BYTE (c); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2350 if (c < 0) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2351 goto invalid_code; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2352 if (c - 0xF2 >= COMPOSITION_RELATIVE \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2353 && c - 0xF2 <= COMPOSITION_WITH_RULE_ALTCHARS) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2354 DECODE_EMACS_MULE_21_COMPOSITION (); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2355 else if (c < 0xA0) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2356 goto invalid_code; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2357 else if (c < 0xC0) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2358 { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2359 DECODE_EMACS_MULE_20_RELATIVE_COMPOSITION (); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2360 /* Re-read C as a composition component. */ \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2361 src = current_src; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2362 } \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2363 else if (c == 0xFF) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2364 DECODE_EMACS_MULE_20_RULEBASE_COMPOSITION (); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2365 else \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2366 goto invalid_code; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2367 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2368
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2369 #define EMACS_MULE_COMPOSITION_END() \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2370 do { \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2371 int idx = - cmp_status->length; \
90354
450fb16a4bf4 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90350
diff changeset
2372 \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2373 if (cmp_status->old_form) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2374 charbuf[idx + 2] = cmp_status->nchars; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2375 else if (cmp_status->method > COMPOSITION_RELATIVE) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2376 charbuf[idx] = charbuf[idx + 2] - cmp_status->length; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2377 cmp_status->state = COMPOSING_NO; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2378 } while (0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2379
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2380
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2381 static int
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2382 emacs_mule_finish_composition (charbuf, cmp_status)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2383 int *charbuf;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2384 struct composition_status *cmp_status;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2385 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2386 int idx = - cmp_status->length;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2387 int new_chars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2388
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2389 if (cmp_status->old_form && cmp_status->nchars > 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2390 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2391 charbuf[idx + 2] = cmp_status->nchars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2392 new_chars = 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2393 if (cmp_status->method == COMPOSITION_WITH_RULE
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2394 && cmp_status->state == COMPOSING_CHAR)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2395 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2396 /* The last rule was invalid. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2397 int rule = charbuf[-1] + 0xA0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2398
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2399 charbuf[-2] = BYTE8_TO_CHAR (rule);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2400 charbuf[-1] = -1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2401 new_chars = 1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2402 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2403 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2404 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2405 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2406 charbuf[idx++] = BYTE8_TO_CHAR (0x80);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2407
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2408 if (cmp_status->method == COMPOSITION_WITH_RULE)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2409 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2410 charbuf[idx++] = BYTE8_TO_CHAR (0xFF);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2411 charbuf[idx++] = -3;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2412 charbuf[idx++] = 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2413 new_chars = 1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2414 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2415 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2416 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2417 int nchars = charbuf[idx + 1] + 0xA0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2418 int nbytes = charbuf[idx + 2] + 0xA0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2419
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2420 charbuf[idx++] = BYTE8_TO_CHAR (0xF2 + cmp_status->method);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2421 charbuf[idx++] = BYTE8_TO_CHAR (nbytes);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2422 charbuf[idx++] = BYTE8_TO_CHAR (nchars);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2423 charbuf[idx++] = -1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2424 new_chars = 4;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2425 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2426 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2427 cmp_status->state = COMPOSING_NO;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2428 return new_chars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2429 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2430
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2431 #define EMACS_MULE_MAYBE_FINISH_COMPOSITION() \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2432 do { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2433 if (cmp_status->state != COMPOSING_NO) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2434 char_offset += emacs_mule_finish_composition (charbuf, cmp_status); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2435 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2436
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2437
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2438 static void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2439 decode_coding_emacs_mule (coding)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2440 struct coding_system *coding;
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2441 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2442 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
2443 const unsigned char *src_end = coding->source + coding->src_bytes;
59168
0345f2b10f1d (decode_coding_XXX, decode_composition_emacs_mule)
Dan Nicolaescu <dann@ics.uci.edu>
parents: 59095
diff changeset
2444 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
2445 int *charbuf = coding->charbuf + coding->charbuf_used;
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
2446 /* We may produce two annocations (charset and composition) in one
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
2447 loop and one more charset annocation at the end. */
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
2448 int *charbuf_end
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
2449 = coding->charbuf + coding->charbuf_size - (MAX_ANNOTATION_LENGTH * 3);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2450 int consumed_chars = 0, consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2451 int multibytep = coding->src_multibyte;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
2452 Lisp_Object attrs, charset_list;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2453 int char_offset = coding->produced_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2454 int last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2455 int last_id = charset_ascii;
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
2456 int eol_crlf =
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
2457 !inhibit_eol_conversion && EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2458 int byte_after_cr = -1;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2459 struct composition_status *cmp_status = &coding->spec.emacs_mule.cmp_status;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2460
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
2461 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2462
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2463 if (cmp_status->state != COMPOSING_NO)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2464 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2465 int i;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2466
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2467 for (i = 0; i < cmp_status->length; i++)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2468 *charbuf++ = cmp_status->carryover[i];
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2469 coding->annotated = 1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2470 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2471
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2472 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2473 {
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2474 int c, id;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2475
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2476 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2477 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2478
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2479 if (charbuf >= charbuf_end)
100936
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
2480 {
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
2481 if (byte_after_cr >= 0)
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
2482 src_base--;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
2483 break;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
2484 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2485
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2486 if (byte_after_cr >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2487 c = byte_after_cr, byte_after_cr = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2488 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2489 ONE_MORE_BYTE (c);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2490
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2491 if (c < 0 || c == 0x80)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2492 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2493 EMACS_MULE_MAYBE_FINISH_COMPOSITION ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2494 if (c < 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2495 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2496 *charbuf++ = -c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2497 char_offset++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2498 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2499 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2500 DECODE_EMACS_MULE_COMPOSITION_START ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2501 continue;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2502 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2503
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2504 if (c < 0x80)
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2505 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2506 if (eol_crlf && c == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
2507 ONE_MORE_BYTE (byte_after_cr);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2508 id = charset_ascii;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2509 if (cmp_status->state != COMPOSING_NO)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2510 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2511 if (cmp_status->old_form)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2512 EMACS_MULE_MAYBE_FINISH_COMPOSITION ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2513 else if (cmp_status->state >= COMPOSING_COMPONENT_CHAR)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2514 cmp_status->ncomps--;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2515 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2516 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2517 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2518 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2519 int nchars, nbytes;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2520
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2521 c = emacs_mule_char (coding, src_base, &nbytes, &nchars, &id,
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2522 cmp_status);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2523 if (c < 0)
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2524 {
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2525 if (c == -1)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2526 goto invalid_code;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2527 if (c == -2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2528 break;
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2529 }
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2530 src = src_base + nbytes;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2531 consumed_chars = consumed_chars_base + nchars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2532 if (cmp_status->state >= COMPOSING_COMPONENT_CHAR)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2533 cmp_status->ncomps -= nchars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2534 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2535
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2536 /* Now if C >= 0, we found a normally encoded characer, if C <
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2537 0, we found an old-style composition component character or
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2538 rule. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2539
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2540 if (cmp_status->state == COMPOSING_NO)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2541 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2542 if (last_id != id)
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2543 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2544 if (last_id != charset_ascii)
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2545 ADD_CHARSET_DATA (charbuf, char_offset - last_offset,
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2546 last_id);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2547 last_id = id;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2548 last_offset = char_offset;
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2549 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2550 *charbuf++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2551 char_offset++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2552 }
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2553 else if (cmp_status->state == COMPOSING_CHAR)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2554 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2555 if (cmp_status->old_form)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2556 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2557 if (c >= 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2558 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2559 EMACS_MULE_MAYBE_FINISH_COMPOSITION ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2560 *charbuf++ = c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2561 char_offset++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2562 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2563 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2564 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2565 *charbuf++ = -c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2566 cmp_status->nchars++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2567 cmp_status->length++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2568 if (cmp_status->nchars == MAX_COMPOSITION_COMPONENTS)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2569 EMACS_MULE_COMPOSITION_END ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2570 else if (cmp_status->method == COMPOSITION_WITH_RULE)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2571 cmp_status->state = COMPOSING_RULE;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2572 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2573 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2574 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2575 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2576 *charbuf++ = c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2577 cmp_status->length++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2578 cmp_status->nchars--;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2579 if (cmp_status->nchars == 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2580 EMACS_MULE_COMPOSITION_END ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2581 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2582 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2583 else if (cmp_status->state == COMPOSING_RULE)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2584 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2585 int rule;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2586
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2587 if (c >= 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2588 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2589 EMACS_MULE_COMPOSITION_END ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2590 *charbuf++ = c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2591 char_offset++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2592 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2593 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2594 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2595 c = -c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2596 DECODE_EMACS_MULE_COMPOSITION_RULE_20 (c, rule);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2597 if (rule < 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2598 goto invalid_code;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2599 *charbuf++ = -2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2600 *charbuf++ = rule;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2601 cmp_status->length += 2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2602 cmp_status->state = COMPOSING_CHAR;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2603 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2604 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2605 else if (cmp_status->state == COMPOSING_COMPONENT_CHAR)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2606 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2607 *charbuf++ = c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2608 cmp_status->length++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2609 if (cmp_status->ncomps == 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2610 cmp_status->state = COMPOSING_CHAR;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2611 else if (cmp_status->ncomps > 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2612 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2613 if (cmp_status->method == COMPOSITION_WITH_RULE_ALTCHARS)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2614 cmp_status->state = COMPOSING_COMPONENT_RULE;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2615 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2616 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2617 EMACS_MULE_MAYBE_FINISH_COMPOSITION ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2618 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2619 else /* COMPOSING_COMPONENT_RULE */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2620 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2621 int rule;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2622
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2623 DECODE_EMACS_MULE_COMPOSITION_RULE_21 (c, rule);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2624 if (rule < 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2625 goto invalid_code;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2626 *charbuf++ = -2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2627 *charbuf++ = rule;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2628 cmp_status->length += 2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2629 cmp_status->ncomps--;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2630 if (cmp_status->ncomps > 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2631 cmp_status->state = COMPOSING_COMPONENT_CHAR;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2632 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2633 EMACS_MULE_MAYBE_FINISH_COMPOSITION ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2634 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2635 continue;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2636
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2637 retry:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2638 src = src_base;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2639 consumed_chars = consumed_chars_base;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2640 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2641
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2642 invalid_code:
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2643 EMACS_MULE_MAYBE_FINISH_COMPOSITION ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2644 src = src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2645 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2646 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2647 *charbuf++ = ASCII_BYTE_P (c) ? c : BYTE8_TO_CHAR (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2648 char_offset++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2649 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2650 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2651
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2652 no_more_source:
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2653 if (cmp_status->state != COMPOSING_NO)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2654 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2655 if (coding->mode & CODING_MODE_LAST_BLOCK)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2656 EMACS_MULE_MAYBE_FINISH_COMPOSITION ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2657 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2658 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2659 int i;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2660
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2661 charbuf -= cmp_status->length;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2662 for (i = 0; i < cmp_status->length; i++)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2663 cmp_status->carryover[i] = charbuf[i];
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2664 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
2665 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2666 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
2667 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2668 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2669 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2670 coding->charbuf_used = charbuf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2671 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2672
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2673
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2674 #define EMACS_MULE_LEADING_CODES(id, codes) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2675 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2676 if (id < 0xA0) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2677 codes[0] = id, codes[1] = 0; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2678 else if (id < 0xE0) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2679 codes[0] = 0x9A, codes[1] = id; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2680 else if (id < 0xF0) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2681 codes[0] = 0x9B, codes[1] = id; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2682 else if (id < 0xF5) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2683 codes[0] = 0x9C, codes[1] = id; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2684 else \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2685 codes[0] = 0x9D, codes[1] = id; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2686 } while (0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2687
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2688
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2689 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2690 encode_coding_emacs_mule (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2691 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2692 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2693 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2694 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2695 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2696 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2697 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2698 int safe_room = 8;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2699 int produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
2700 Lisp_Object attrs, charset_list;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2701 int c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2702 int preferred_charset_id = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2703
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
2704 CODING_GET_INFO (coding, attrs, charset_list);
89644
fc9cda144ffc (encode_coding_emacs_mule): Resync charset_list to
Kenichi Handa <handa@m17n.org>
parents: 89642
diff changeset
2705 if (! EQ (charset_list, Vemacs_mule_charset_list))
fc9cda144ffc (encode_coding_emacs_mule): Resync charset_list to
Kenichi Handa <handa@m17n.org>
parents: 89642
diff changeset
2706 {
fc9cda144ffc (encode_coding_emacs_mule): Resync charset_list to
Kenichi Handa <handa@m17n.org>
parents: 89642
diff changeset
2707 CODING_ATTR_CHARSET_LIST (attrs)
fc9cda144ffc (encode_coding_emacs_mule): Resync charset_list to
Kenichi Handa <handa@m17n.org>
parents: 89642
diff changeset
2708 = charset_list = Vemacs_mule_charset_list;
fc9cda144ffc (encode_coding_emacs_mule): Resync charset_list to
Kenichi Handa <handa@m17n.org>
parents: 89642
diff changeset
2709 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2710
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2711 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2712 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2713 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2714 c = *charbuf++;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2715
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2716 if (c < 0)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2717 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2718 /* Handle an annotation. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2719 switch (*charbuf)
54320
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2720 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2721 case CODING_ANNOTATE_COMPOSITION_MASK:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2722 /* Not yet implemented. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2723 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2724 case CODING_ANNOTATE_CHARSET_MASK:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2725 preferred_charset_id = charbuf[3];
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2726 if (preferred_charset_id >= 0
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2727 && NILP (Fmemq (make_number (preferred_charset_id),
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2728 charset_list)))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2729 preferred_charset_id = -1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2730 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2731 default:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2732 abort ();
54320
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2733 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2734 charbuf += -c - 1;
32806
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2735 continue;
9502d0a5b2ad (decode_coding_emacs_mule): If coding->eol_type is CR
Eli Zaretskii <eliz@gnu.org>
parents: 32745
diff changeset
2736 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2737
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2738 if (ASCII_CHAR_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2739 EMIT_ONE_ASCII_BYTE (c);
88690
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
2740 else if (CHAR_BYTE8_P (c))
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
2741 {
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
2742 c = CHAR_TO_BYTE8 (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
2743 EMIT_ONE_BYTE (c);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2744 }
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2745 else
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2746 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2747 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2748 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2749 int dimension;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2750 int emacs_mule_id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2751 unsigned char leading_codes[2];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2752
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2753 if (preferred_charset_id >= 0)
54320
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2754 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2755 charset = CHARSET_FROM_ID (preferred_charset_id);
100176
5706ca7c3d02 (encode_coding_emacs_mule): Be sure to set `code'.
Kenichi Handa <handa@m17n.org>
parents: 100170
diff changeset
2756 if (CHAR_CHARSET_P (c, charset))
5706ca7c3d02 (encode_coding_emacs_mule): Be sure to set `code'.
Kenichi Handa <handa@m17n.org>
parents: 100170
diff changeset
2757 code = ENCODE_CHAR (charset, c);
5706ca7c3d02 (encode_coding_emacs_mule): Be sure to set `code'.
Kenichi Handa <handa@m17n.org>
parents: 100170
diff changeset
2758 else
5706ca7c3d02 (encode_coding_emacs_mule): Be sure to set `code'.
Kenichi Handa <handa@m17n.org>
parents: 100170
diff changeset
2759 charset = char_charset (c, charset_list, &code);
54320
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2760 }
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2761 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
2762 charset = char_charset (c, charset_list, &code);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2763 if (! charset)
54320
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2764 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2765 c = coding->default_char;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2766 if (ASCII_CHAR_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2767 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2768 EMIT_ONE_ASCII_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2769 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2770 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2771 charset = char_charset (c, charset_list, &code);
54320
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2772 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2773 dimension = CHARSET_DIMENSION (charset);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2774 emacs_mule_id = CHARSET_EMACS_MULE_ID (charset);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2775 EMACS_MULE_LEADING_CODES (emacs_mule_id, leading_codes);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2776 EMIT_ONE_BYTE (leading_codes[0]);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2777 if (leading_codes[1])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2778 EMIT_ONE_BYTE (leading_codes[1]);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2779 if (dimension == 1)
89642
e97441b6244b (encode_coding_emacs_mule): Emit bytes with MSB.
Kenichi Handa <handa@m17n.org>
parents: 89575
diff changeset
2780 EMIT_ONE_BYTE (code | 0x80);
54320
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2781 else
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2782 {
89642
e97441b6244b (encode_coding_emacs_mule): Emit bytes with MSB.
Kenichi Handa <handa@m17n.org>
parents: 89575
diff changeset
2783 code |= 0x8080;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2784 EMIT_ONE_BYTE (code >> 8);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2785 EMIT_ONE_BYTE (code & 0xFF);
54320
a7e59b39de35 (decode_coding_emacs_mule): Handle insufficent source correctly.
Kenichi Handa <handa@m17n.org>
parents: 54303
diff changeset
2786 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2787 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2788 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
2789 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2790 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2791 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2792 return 0;
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
2793 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2794
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2795
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2796 /*** 7. ISO2022 handlers ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2797
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2798 /* The following note describes the coding system ISO2022 briefly.
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2799 Since the intention of this note is to help understand the
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2800 functions in this file, some parts are NOT ACCURATE or are OVERLY
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2801 SIMPLIFIED. For thorough understanding, please refer to the
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2802 original document of ISO2022. This is equivalent to the standard
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2803 ECMA-35, obtainable from <URL:http://www.ecma.ch/> (*).
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2804
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2805 ISO2022 provides many mechanisms to encode several character sets
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2806 in 7-bit and 8-bit environments. For 7-bit environments, all text
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2807 is encoded using bytes less than 128. This may make the encoded
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2808 text a little bit longer, but the text passes more easily through
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2809 several types of gateway, some of which strip off the MSB (Most
36087
05ef3feab39b Doc and message fixes.
Dave Love <fx@gnu.org>
parents: 35995
diff changeset
2810 Significant Bit).
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2811
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2812 There are two kinds of character sets: control character sets and
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2813 graphic character sets. The former contain control characters such
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2814 as `newline' and `escape' to provide control functions (control
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2815 functions are also provided by escape sequences). The latter
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2816 contain graphic characters such as 'A' and '-'. Emacs recognizes
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2817 two control character sets and many graphic character sets.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2818
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2819 Graphic character sets are classified into one of the following
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2820 four classes, according to the number of bytes (DIMENSION) and
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2821 number of characters in one dimension (CHARS) of the set:
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2822 - DIMENSION1_CHARS94
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2823 - DIMENSION1_CHARS96
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2824 - DIMENSION2_CHARS94
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2825 - DIMENSION2_CHARS96
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2826
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2827 In addition, each character set is assigned an identification tag,
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2828 unique for each set, called the "final character" (denoted as <F>
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2829 hereafter). The <F> of each character set is decided by ECMA(*)
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2830 when it is registered in ISO. The code range of <F> is 0x30..0x7F
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2831 (0x30..0x3F are for private use only).
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2832
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2833 Note (*): ECMA = European Computer Manufacturers Association
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2834
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2835 Here are examples of graphic character sets [NAME(<F>)]:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2836 o DIMENSION1_CHARS94 -- ASCII('B'), right-half-of-JISX0201('I'), ...
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2837 o DIMENSION1_CHARS96 -- right-half-of-ISO8859-1('A'), ...
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2838 o DIMENSION2_CHARS94 -- GB2312('A'), JISX0208('B'), ...
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2839 o DIMENSION2_CHARS96 -- none for the moment
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2840
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2841 A code area (1 byte=8 bits) is divided into 4 areas, C0, GL, C1, and GR.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2842 C0 [0x00..0x1F] -- control character plane 0
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2843 GL [0x20..0x7F] -- graphic character plane 0
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2844 C1 [0x80..0x9F] -- control character plane 1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2845 GR [0xA0..0xFF] -- graphic character plane 1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2846
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2847 A control character set is directly designated and invoked to C0 or
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2848 C1 by an escape sequence. The most common case is that:
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2849 - ISO646's control character set is designated/invoked to C0, and
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2850 - ISO6429's control character set is designated/invoked to C1,
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2851 and usually these designations/invocations are omitted in encoded
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2852 text. In a 7-bit environment, only C0 can be used, and a control
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2853 character for C1 is encoded by an appropriate escape sequence to
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2854 fit into the environment. All control characters for C1 are
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2855 defined to have corresponding escape sequences.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2856
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2857 A graphic character set is at first designated to one of four
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2858 graphic registers (G0 through G3), then these graphic registers are
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2859 invoked to GL or GR. These designations and invocations can be
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2860 done independently. The most common case is that G0 is invoked to
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2861 GL, G1 is invoked to GR, and ASCII is designated to G0. Usually
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2862 these invocations and designations are omitted in encoded text.
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2863 In a 7-bit environment, only GL can be used.
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2864
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2865 When a graphic character set of CHARS94 is invoked to GL, codes
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2866 0x20 and 0x7F of the GL area work as control characters SPACE and
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2867 DEL respectively, and codes 0xA0 and 0xFF of the GR area should not
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2868 be used.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2869
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2870 There are two ways of invocation: locking-shift and single-shift.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2871 With locking-shift, the invocation lasts until the next different
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2872 invocation, whereas with single-shift, the invocation affects the
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2873 following character only and doesn't affect the locking-shift
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2874 state. Invocations are done by the following control characters or
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2875 escape sequences:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2876
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2877 ----------------------------------------------------------------------
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2878 abbrev function cntrl escape seq description
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2879 ----------------------------------------------------------------------
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2880 SI/LS0 (shift-in) 0x0F none invoke G0 into GL
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2881 SO/LS1 (shift-out) 0x0E none invoke G1 into GL
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2882 LS2 (locking-shift-2) none ESC 'n' invoke G2 into GL
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2883 LS3 (locking-shift-3) none ESC 'o' invoke G3 into GL
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2884 LS1R (locking-shift-1 right) none ESC '~' invoke G1 into GR (*)
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2885 LS2R (locking-shift-2 right) none ESC '}' invoke G2 into GR (*)
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2886 LS3R (locking-shift 3 right) none ESC '|' invoke G3 into GR (*)
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2887 SS2 (single-shift-2) 0x8E ESC 'N' invoke G2 for one char
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2888 SS3 (single-shift-3) 0x8F ESC 'O' invoke G3 for one char
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2889 ----------------------------------------------------------------------
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2890 (*) These are not used by any known coding system.
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2891
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2892 Control characters for these functions are defined by macros
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2893 ISO_CODE_XXX in `coding.h'.
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2894
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2895 Designations are done by the following escape sequences:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2896 ----------------------------------------------------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2897 escape sequence description
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2898 ----------------------------------------------------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2899 ESC '(' <F> designate DIMENSION1_CHARS94<F> to G0
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2900 ESC ')' <F> designate DIMENSION1_CHARS94<F> to G1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2901 ESC '*' <F> designate DIMENSION1_CHARS94<F> to G2
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2902 ESC '+' <F> designate DIMENSION1_CHARS94<F> to G3
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2903 ESC ',' <F> designate DIMENSION1_CHARS96<F> to G0 (*)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2904 ESC '-' <F> designate DIMENSION1_CHARS96<F> to G1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2905 ESC '.' <F> designate DIMENSION1_CHARS96<F> to G2
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2906 ESC '/' <F> designate DIMENSION1_CHARS96<F> to G3
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2907 ESC '$' '(' <F> designate DIMENSION2_CHARS94<F> to G0 (**)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2908 ESC '$' ')' <F> designate DIMENSION2_CHARS94<F> to G1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2909 ESC '$' '*' <F> designate DIMENSION2_CHARS94<F> to G2
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2910 ESC '$' '+' <F> designate DIMENSION2_CHARS94<F> to G3
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2911 ESC '$' ',' <F> designate DIMENSION2_CHARS96<F> to G0 (*)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2912 ESC '$' '-' <F> designate DIMENSION2_CHARS96<F> to G1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2913 ESC '$' '.' <F> designate DIMENSION2_CHARS96<F> to G2
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2914 ESC '$' '/' <F> designate DIMENSION2_CHARS96<F> to G3
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2915 ----------------------------------------------------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2916
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2917 In this list, "DIMENSION1_CHARS94<F>" means a graphic character set
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2918 of dimension 1, chars 94, and final character <F>, etc...
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2919
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2920 Note (*): Although these designations are not allowed in ISO2022,
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2921 Emacs accepts them on decoding, and produces them on encoding
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2922 CHARS96 character sets in a coding system which is characterized as
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2923 7-bit environment, non-locking-shift, and non-single-shift.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2924
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2925 Note (**): If <F> is '@', 'A', or 'B', the intermediate character
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2926 '(' must be omitted. We refer to this as "short-form" hereafter.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2927
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2928 Now you may notice that there are a lot of ways of encoding the
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2929 same multilingual text in ISO2022. Actually, there exist many
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2930 coding systems such as Compound Text (used in X11's inter client
36087
05ef3feab39b Doc and message fixes.
Dave Love <fx@gnu.org>
parents: 35995
diff changeset
2931 communication, ISO-2022-JP (used in Japanese Internet), ISO-2022-KR
05ef3feab39b Doc and message fixes.
Dave Love <fx@gnu.org>
parents: 35995
diff changeset
2932 (used in Korean Internet), EUC (Extended UNIX Code, used in Asian
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2933 localized platforms), and all of these are variants of ISO2022.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2934
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2935 In addition to the above, Emacs handles two more kinds of escape
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2936 sequences: ISO6429's direction specification and Emacs' private
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2937 sequence for specifying character composition.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2938
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2939 ISO6429's direction specification takes the following form:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2940 o CSI ']' -- end of the current direction
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2941 o CSI '0' ']' -- end of the current direction
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2942 o CSI '1' ']' -- start of left-to-right text
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2943 o CSI '2' ']' -- start of right-to-left text
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2944 The control character CSI (0x9B: control sequence introducer) is
24425
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2945 abbreviated to the escape sequence ESC '[' in a 7-bit environment.
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2946
61c6b3be1d51 Comment for ISO 2022 encoding mechanism modified.
Kenichi Handa <handa@m17n.org>
parents: 24344
diff changeset
2947 Character composition specification takes the following form:
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2948 o ESC '0' -- start relative composition
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2949 o ESC '1' -- end composition
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2950 o ESC '2' -- start rule-base composition (*)
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2951 o ESC '3' -- start relative composition with alternate chars (**)
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2952 o ESC '4' -- start rule-base composition with alternate chars (**)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2953 Since these are not standard escape sequences of any ISO standard,
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2954 the use of them with these meanings is restricted to Emacs only.
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2955
88771
75c78754826d comments
Dave Love <fx@gnu.org>
parents: 88690
diff changeset
2956 (*) This form is used only in Emacs 20.7 and older versions,
75c78754826d comments
Dave Love <fx@gnu.org>
parents: 88690
diff changeset
2957 but newer versions can safely decode it.
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2958 (**) This form is used only in Emacs 21.1 and newer versions,
88771
75c78754826d comments
Dave Love <fx@gnu.org>
parents: 88690
diff changeset
2959 and older versions can't decode it.
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2960
35053
e3e1ff3616fa Commentary changes.
Dave Love <fx@gnu.org>
parents: 34988
diff changeset
2961 Here's a list of example usages of these composition escape
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2962 sequences (categorized by `enum composition_method').
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2963
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2964 COMPOSITION_RELATIVE:
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2965 ESC 0 CHAR [ CHAR ] ESC 1
36087
05ef3feab39b Doc and message fixes.
Dave Love <fx@gnu.org>
parents: 35995
diff changeset
2966 COMPOSITION_WITH_RULE:
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2967 ESC 2 CHAR [ RULE CHAR ] ESC 1
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2968 COMPOSITION_WITH_ALTCHARS:
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2969 ESC 3 ALTCHAR [ ALTCHAR ] ESC 0 CHAR [ CHAR ] ESC 1
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
2970 COMPOSITION_WITH_RULE_ALTCHARS:
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
2971 ESC 4 ALTCHAR [ RULE ALTCHAR ] ESC 0 CHAR [ CHAR ] ESC 1 */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2972
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2973 enum iso_code_class_type iso_code_class[256];
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
2974
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2975 #define SAFE_CHARSET_P(coding, id) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2976 ((id) <= (coding)->max_charset_id \
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
2977 && (coding)->safe_charsets[id] != 255)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2978
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2979
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2980 #define SHIFT_OUT_OK(category) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2981 (CODING_ISO_INITIAL (&coding_categories[category], 1) >= 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2982
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2983 static void
88631
780b91d4a7e5 (setup_iso_safe_charsets): Fix arg decl for K&R.
Dave Love <fx@gnu.org>
parents: 88607
diff changeset
2984 setup_iso_safe_charsets (attrs)
780b91d4a7e5 (setup_iso_safe_charsets): Fix arg decl for K&R.
Dave Love <fx@gnu.org>
parents: 88607
diff changeset
2985 Lisp_Object attrs;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2986 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2987 Lisp_Object charset_list, safe_charsets;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2988 Lisp_Object request;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2989 Lisp_Object reg_usage;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2990 Lisp_Object tail;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2991 int reg94, reg96;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2992 int flags = XINT (AREF (attrs, coding_attr_iso_flags));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2993 int max_charset_id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2994
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2995 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2996 if ((flags & CODING_ISO_FLAG_FULL_SUPPORT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2997 && ! EQ (charset_list, Viso_2022_charset_list))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2998 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
2999 CODING_ATTR_CHARSET_LIST (attrs)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3000 = charset_list = Viso_2022_charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3001 ASET (attrs, coding_attr_safe_charsets, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3002 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3003
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3004 if (STRINGP (AREF (attrs, coding_attr_safe_charsets)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3005 return;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3006
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3007 max_charset_id = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3008 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3009 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3010 int id = XINT (XCAR (tail));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3011 if (max_charset_id < id)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3012 max_charset_id = id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3013 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3014
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
3015 safe_charsets = make_uninit_string (max_charset_id + 1);
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
3016 memset (SDATA (safe_charsets), 255, max_charset_id + 1);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3017 request = AREF (attrs, coding_attr_iso_request);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3018 reg_usage = AREF (attrs, coding_attr_iso_usage);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3019 reg94 = XINT (XCAR (reg_usage));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3020 reg96 = XINT (XCDR (reg_usage));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3021
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3022 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3023 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3024 Lisp_Object id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3025 Lisp_Object reg;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3026 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3027
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3028 id = XCAR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3029 charset = CHARSET_FROM_ID (XINT (id));
88681
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3030 reg = Fcdr (Fassq (id, request));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3031 if (! NILP (reg))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3032 SSET (safe_charsets, XINT (id), XINT (reg));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3033 else if (charset->iso_chars_96)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3034 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3035 if (reg96 < 4)
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3036 SSET (safe_charsets, XINT (id), reg96);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3037 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3038 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3039 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3040 if (reg94 < 4)
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3041 SSET (safe_charsets, XINT (id), reg94);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3042 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3043 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3044 ASET (attrs, coding_attr_safe_charsets, safe_charsets);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3045 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3046
50047
8e17fbb2ac77 (CODING_ADD_COMPOSITION_COMPONENT): If the number of
Kenichi Handa <handa@m17n.org>
parents: 49600
diff changeset
3047
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3048 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3049 Check if a text is encoded in one of ISO-2022 based codig systems.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3050 If it is, return 1, else return 0. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3051
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
3052 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3053 detect_coding_iso_2022 (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3054 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3055 struct coding_detection_info *detect_info;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3056 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3057 const unsigned char *src = coding->source, *src_base = src;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3058 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3059 int multibytep = coding->src_multibyte;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3060 int single_shifting = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3061 int id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3062 int c, c1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3063 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3064 int i;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3065 int rejected = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3066 int found = 0;
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3067 int composition_count = -1;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3068
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3069 detect_info->checked |= CATEGORY_MASK_ISO;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3070
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3071 for (i = coding_category_iso_7; i <= coding_category_iso_8_else; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3072 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3073 struct coding_system *this = &(coding_categories[i]);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3074 Lisp_Object attrs, val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3075
94944
c16046e21b90 (detect_coding_iso_2022): Ignore a coding category that
Kenichi Handa <handa@m17n.org>
parents: 93877
diff changeset
3076 if (this->id < 0)
c16046e21b90 (detect_coding_iso_2022): Ignore a coding category that
Kenichi Handa <handa@m17n.org>
parents: 93877
diff changeset
3077 continue;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3078 attrs = CODING_ID_ATTRS (this->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3079 if (CODING_ISO_FLAGS (this) & CODING_ISO_FLAG_FULL_SUPPORT
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
3080 && ! EQ (CODING_ATTR_CHARSET_LIST (attrs), Viso_2022_charset_list))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3081 setup_iso_safe_charsets (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3082 val = CODING_ATTR_SAFE_CHARSETS (attrs);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3083 this->max_charset_id = SCHARS (val) - 1;
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
3084 this->safe_charsets = SDATA (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3085 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3086
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3087 /* A coding system of this category is always ASCII compatible. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3088 src += coding->head_ascii;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3089
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3090 while (rejected != CATEGORY_MASK_ISO)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3091 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
3092 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3093 ONE_MORE_BYTE (c);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3094 switch (c)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3095 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3096 case ISO_CODE_ESC:
30204
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
3097 if (inhibit_iso_escape_detection)
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
3098 break;
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3099 single_shifting = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3100 ONE_MORE_BYTE (c);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3101 if (c >= '(' && c <= '/')
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3102 {
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3103 /* Designation sequence for a charset of dimension 1. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3104 ONE_MORE_BYTE (c1);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3105 if (c1 < ' ' || c1 >= 0x80
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3106 || (id = iso_charset_table[0][c >= ','][c1]) < 0)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3107 /* Invalid designation sequence. Just ignore. */
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3108 break;
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3109 }
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3110 else if (c == '$')
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3111 {
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3112 /* Designation sequence for a charset of dimension 2. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3113 ONE_MORE_BYTE (c);
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3114 if (c >= '@' && c <= 'B')
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3115 /* Designation for JISX0208.1978, GB2312, or JISX0208. */
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3116 id = iso_charset_table[1][0][c];
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3117 else if (c >= '(' && c <= '/')
17320
9d15bec5f47e (detect_coding_iso2022, detect_coding_mask): Ignore
Kenichi Handa <handa@m17n.org>
parents: 17304
diff changeset
3118 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3119 ONE_MORE_BYTE (c1);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3120 if (c1 < ' ' || c1 >= 0x80
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3121 || (id = iso_charset_table[1][c >= ','][c1]) < 0)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3122 /* Invalid designation sequence. Just ignore. */
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3123 break;
17320
9d15bec5f47e (detect_coding_iso2022, detect_coding_mask): Ignore
Kenichi Handa <handa@m17n.org>
parents: 17304
diff changeset
3124 }
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3125 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3126 /* Invalid designation sequence. Just ignore it. */
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3127 break;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3128 }
23116
6736da064f4a (detect_coding_iso2022): Handle ESC N and ESC O
Kenichi Handa <handa@m17n.org>
parents: 23089
diff changeset
3129 else if (c == 'N' || c == 'O')
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3130 {
23116
6736da064f4a (detect_coding_iso2022): Handle ESC N and ESC O
Kenichi Handa <handa@m17n.org>
parents: 23089
diff changeset
3131 /* ESC <Fe> for SS2 or SS3. */
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3132 single_shifting = 1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3133 rejected |= CATEGORY_MASK_ISO_7BIT | CATEGORY_MASK_ISO_8BIT;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3134 break;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3135 }
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3136 else if (c == '1')
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3137 {
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3138 /* End of composition. */
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3139 if (composition_count < 0
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3140 || composition_count > MAX_COMPOSITION_COMPONENTS)
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3141 /* Invalid */
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3142 break;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3143 composition_count = -1;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3144 found |= CATEGORY_MASK_ISO;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3145 }
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3146 else if (c >= '0' && c <= '4')
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3147 {
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3148 /* ESC <Fp> for start/end composition. */
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3149 composition_count = 0;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3150 break;
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3151 }
19134
8fa6e23f8d22 (detect_coding_iso2022): Do not exclude posibility of
Kenichi Handa <handa@m17n.org>
parents: 19118
diff changeset
3152 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3153 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3154 /* Invalid escape sequence. Just ignore it. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3155 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3156 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3157
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3158 /* We found a valid designation sequence for CHARSET. */
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3159 rejected |= CATEGORY_MASK_ISO_8BIT;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3160 if (SAFE_CHARSET_P (&coding_categories[coding_category_iso_7],
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3161 id))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3162 found |= CATEGORY_MASK_ISO_7;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3163 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3164 rejected |= CATEGORY_MASK_ISO_7;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3165 if (SAFE_CHARSET_P (&coding_categories[coding_category_iso_7_tight],
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3166 id))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3167 found |= CATEGORY_MASK_ISO_7_TIGHT;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3168 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3169 rejected |= CATEGORY_MASK_ISO_7_TIGHT;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3170 if (SAFE_CHARSET_P (&coding_categories[coding_category_iso_7_else],
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3171 id))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3172 found |= CATEGORY_MASK_ISO_7_ELSE;
23116
6736da064f4a (detect_coding_iso2022): Handle ESC N and ESC O
Kenichi Handa <handa@m17n.org>
parents: 23089
diff changeset
3173 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3174 rejected |= CATEGORY_MASK_ISO_7_ELSE;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3175 if (SAFE_CHARSET_P (&coding_categories[coding_category_iso_8_else],
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3176 id))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3177 found |= CATEGORY_MASK_ISO_8_ELSE;
23116
6736da064f4a (detect_coding_iso2022): Handle ESC N and ESC O
Kenichi Handa <handa@m17n.org>
parents: 23089
diff changeset
3178 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3179 rejected |= CATEGORY_MASK_ISO_8_ELSE;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3180 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3181
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3182 case ISO_CODE_SO:
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3183 case ISO_CODE_SI:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3184 /* Locking shift out/in. */
30204
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
3185 if (inhibit_iso_escape_detection)
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
3186 break;
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3187 single_shifting = 0;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3188 rejected |= CATEGORY_MASK_ISO_7BIT | CATEGORY_MASK_ISO_8BIT;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3189 break;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3190
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3191 case ISO_CODE_CSI:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3192 /* Control sequence introducer. */
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3193 single_shifting = 0;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3194 rejected |= CATEGORY_MASK_ISO_7BIT | CATEGORY_MASK_ISO_7_ELSE;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3195 found |= CATEGORY_MASK_ISO_8_ELSE;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3196 goto check_extra_latin;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3197
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3198 case ISO_CODE_SS2:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3199 case ISO_CODE_SS3:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3200 /* Single shift. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3201 if (inhibit_iso_escape_detection)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3202 break;
89780
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
3203 single_shifting = 0;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3204 rejected |= CATEGORY_MASK_ISO_7BIT;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3205 if (CODING_ISO_FLAGS (&coding_categories[coding_category_iso_8_1])
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3206 & CODING_ISO_FLAG_SINGLE_SHIFT)
89780
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
3207 found |= CATEGORY_MASK_ISO_8_1, single_shifting = 1;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3208 if (CODING_ISO_FLAGS (&coding_categories[coding_category_iso_8_2])
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3209 & CODING_ISO_FLAG_SINGLE_SHIFT)
89780
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
3210 found |= CATEGORY_MASK_ISO_8_2, single_shifting = 1;
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
3211 if (single_shifting)
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
3212 break;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3213 goto check_extra_latin;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3214
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3215 default:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
3216 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
3217 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3218 if (c < 0x80)
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3219 {
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3220 if (composition_count >= 0)
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3221 composition_count++;
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3222 single_shifting = 0;
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3223 break;
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3224 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3225 if (c >= 0xA0)
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
3226 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3227 rejected |= CATEGORY_MASK_ISO_7BIT | CATEGORY_MASK_ISO_7_ELSE;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3228 found |= CATEGORY_MASK_ISO_8_1;
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3229 /* Check the length of succeeding codes of the range
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3230 0xA0..0FF. If the byte length is even, we include
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3231 CATEGORY_MASK_ISO_8_2 in `found'. We can check this
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3232 only when we are not single shifting. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3233 if (! single_shifting
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3234 && ! (rejected & CATEGORY_MASK_ISO_8_2))
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3235 {
29299
b33b38d81020 (detect_coding_iso2022): Fix code for checking
Kenichi Handa <handa@m17n.org>
parents: 29275
diff changeset
3236 int i = 1;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3237 while (src < src_end)
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3238 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3239 ONE_MORE_BYTE (c);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3240 if (c < 0xA0)
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3241 break;
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3242 i++;
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3243 }
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3244
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3245 if (i & 1 && src < src_end)
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3246 {
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3247 rejected |= CATEGORY_MASK_ISO_8_2;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3248 if (composition_count >= 0)
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3249 composition_count += i;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3250 }
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3251 else
99753
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3252 {
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3253 found |= CATEGORY_MASK_ISO_8_2;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3254 if (composition_count >= 0)
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3255 composition_count += i / 2;
c457d1e5edff (detect_coding_iso_2022): Reject invalid composition
Kenichi Handa <handa@m17n.org>
parents: 99074
diff changeset
3256 }
23088
45c36d636f66 (detect_coding_iso2022): Don't check the byte length of
Kenichi Handa <handa@m17n.org>
parents: 23082
diff changeset
3257 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3258 break;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3259 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3260 check_extra_latin:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3261 single_shifting = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3262 if (! VECTORP (Vlatin_extra_code_table)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3263 || NILP (XVECTOR (Vlatin_extra_code_table)->contents[c]))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3264 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3265 rejected = CATEGORY_MASK_ISO;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3266 break;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3267 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3268 if (CODING_ISO_FLAGS (&coding_categories[coding_category_iso_8_1])
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3269 & CODING_ISO_FLAG_LATIN_EXTRA)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3270 found |= CATEGORY_MASK_ISO_8_1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3271 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3272 rejected |= CATEGORY_MASK_ISO_8_1;
89780
a53cb5864a40 (detect_coding_iso_2022): Fix handling of SS2 and SS3.
Kenichi Handa <handa@m17n.org>
parents: 89779
diff changeset
3273 rejected |= CATEGORY_MASK_ISO_8_2;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3274 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3275 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3276 detect_info->rejected |= CATEGORY_MASK_ISO;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3277 return 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3278
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3279 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3280 detect_info->rejected |= rejected;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3281 detect_info->found |= (found & ~rejected);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3282 return 1;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3283 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3284
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3285
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3286 /* Set designation state into CODING. Set CHARS_96 to -1 if the
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3287 escape sequence should be kept. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3288 #define DECODE_DESIGNATION(reg, dim, chars_96, final) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3289 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3290 int id, prev; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3291 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3292 if (final < '0' || final >= 128 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3293 || ((id = ISO_CHARSET_TABLE (dim, chars_96, final)) < 0) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3294 || !SAFE_CHARSET_P (coding, id)) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3295 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3296 CODING_ISO_DESIGNATION (coding, reg) = -2; \
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3297 chars_96 = -1; \
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3298 break; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3299 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3300 prev = CODING_ISO_DESIGNATION (coding, reg); \
88681
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3301 if (id == charset_jisx0201_roman) \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3302 { \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3303 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_USE_ROMAN) \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3304 id = charset_ascii; \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3305 } \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3306 else if (id == charset_jisx0208_1978) \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3307 { \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3308 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_USE_OLDJIS) \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3309 id = charset_jisx0208; \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
3310 } \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3311 CODING_ISO_DESIGNATION (coding, reg) = id; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3312 /* If there was an invalid designation to REG previously, and this \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3313 designation is ASCII to REG, we should keep this designation \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3314 sequence. */ \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3315 if (prev == -2 && id == charset_ascii) \
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3316 chars_96 = -1; \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3317 } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3318
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3319
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3320 /* Handle these composition sequence (ALT: alternate char):
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3321
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3322 (1) relative composition: ESC 0 CHAR ... ESC 1
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3323 (2) rulebase composition: ESC 2 CHAR RULE CHAR RULE ... CHAR ESC 1
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3324 (3) altchar composition: ESC 3 ALT ... ALT ESC 0 CHAR ... ESC 1
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3325 (4) alt&rule composition: ESC 4 ALT RULE ... ALT ESC 0 CHAR ... ESC 1
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3326
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3327 When the start sequence (ESC 0/2/3/4) is found, this annotation
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3328 header is produced.
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3329
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3330 [ -LENGTH(==-5) CODING_ANNOTATE_COMPOSITION_MASK NCHARS(==0) 0 METHOD ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3331
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3332 Then, upon reading CHAR or RULE (one or two bytes), these codes are
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3333 produced until the end sequence (ESC 1) is found:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3334
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3335 (1) CHAR ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3336 (2) CHAR -2 DECODED-RULE CHAR -2 DECODED-RULE ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3337 (3) ALT ... ALT -1 -1 CHAR ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3338 (4) ALT -2 DECODED-RULE ALT -2 DECODED-RULE ... ALT -1 -1 CHAR ... CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3339
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3340 When the end sequence (ESC 1) is found, LENGTH and NCHARS in the
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3341 annotation header is updated as below:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3342
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3343 (1) LENGTH: unchanged, NCHARS: number of CHARs
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3344 (2) LENGTH: unchanged, NCHARS: number of CHARs
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3345 (3) LENGTH: += number of ALTs + 2, NCHARS: number of CHARs
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3346 (4) LENGTH: += number of ALTs * 3, NCHARS: number of CHARs
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3347
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3348 If an error is found while composing, the annotation header is
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3349 changed to:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3350
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3351 [ ESC '0'/'2'/'3'/'4' -2 0 ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3352
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3353 and the sequence [ -2 DECODED-RULE ] is changed to the original
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3354 byte sequence as below:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3355 o the original byte sequence is B: [ B -1 ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3356 o the original byte sequence is B1 B2: [ B1 B2 ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3357 and the sequence [ -1 -1 ] is changed to the original byte
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3358 sequence:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3359 [ ESC '0' ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3360 */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3361
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3362 /* Decode a composition rule C1 and maybe one more byte from the
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3363 source, and set RULE to the encoded composition rule, NBYTES to the
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3364 length of the composition rule. If the rule is invalid, set RULE
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3365 to some negative value. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3366
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3367 #define DECODE_COMPOSITION_RULE(rule, nbytes) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3368 do { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3369 rule = c1 - 32; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3370 if (rule < 0) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3371 break; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3372 if (rule < 81) /* old format (before ver.21) */ \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3373 { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3374 int gref = (rule) / 9; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3375 int nref = (rule) % 9; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3376 if (gref == 4) gref = 10; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3377 if (nref == 4) nref = 10; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3378 rule = COMPOSITION_ENCODE_RULE (gref, nref); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3379 nbytes = 1; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3380 } \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3381 else /* new format (after ver.21) */ \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3382 { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3383 int c; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3384 \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3385 ONE_MORE_BYTE (c); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3386 rule = COMPOSITION_ENCODE_RULE (rule - 81, c - 32); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3387 if (rule >= 0) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3388 rule += 0x100; /* to destinguish it from the old format */ \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3389 nbytes = 2; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3390 } \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3391 } while (0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3392
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3393 #define ENCODE_COMPOSITION_RULE(rule) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3394 do { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3395 int gref = (rule % 0x100) / 12, nref = (rule % 0x100) % 12; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3396 \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3397 if (rule < 0x100) /* old format */ \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3398 { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3399 if (gref == 10) gref = 4; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3400 if (nref == 10) nref = 4; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3401 charbuf[idx] = 32 + gref * 9 + nref; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3402 charbuf[idx + 1] = -1; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3403 new_chars++; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3404 } \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3405 else /* new format */ \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3406 { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3407 charbuf[idx] = 32 + 81 + gref; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3408 charbuf[idx + 1] = 32 + nref; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3409 new_chars += 2; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3410 } \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3411 } while (0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3412
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3413 /* Finish the current composition as invalid. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3414
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3415 static int finish_composition P_ ((int *, struct composition_status *));
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3416
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3417 static int
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3418 finish_composition (charbuf, cmp_status)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3419 int *charbuf;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3420 struct composition_status *cmp_status;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3421 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3422 int idx = - cmp_status->length;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3423 int new_chars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3424
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3425 /* Recover the original ESC sequence */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3426 charbuf[idx++] = ISO_CODE_ESC;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3427 charbuf[idx++] = (cmp_status->method == COMPOSITION_RELATIVE ? '0'
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3428 : cmp_status->method == COMPOSITION_WITH_RULE ? '2'
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3429 : cmp_status->method == COMPOSITION_WITH_ALTCHARS ? '3'
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3430 /* cmp_status->method == COMPOSITION_WITH_RULE_ALTCHARS */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3431 : '4');
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3432 charbuf[idx++] = -2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3433 charbuf[idx++] = 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3434 charbuf[idx++] = -1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3435 new_chars = cmp_status->nchars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3436 if (cmp_status->method >= COMPOSITION_WITH_RULE)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3437 for (; idx < 0; idx++)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3438 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3439 int elt = charbuf[idx];
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3440
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3441 if (elt == -2)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3442 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3443 ENCODE_COMPOSITION_RULE (charbuf[idx + 1]);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3444 idx++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3445 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3446 else if (elt == -1)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3447 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3448 charbuf[idx++] = ISO_CODE_ESC;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3449 charbuf[idx] = '0';
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3450 new_chars += 2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3451 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3452 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3453 cmp_status->state = COMPOSING_NO;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3454 return new_chars;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3455 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3456
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3457 /* If characers are under composition, finish the composition. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3458 #define MAYBE_FINISH_COMPOSITION() \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3459 do { \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3460 if (cmp_status->state != COMPOSING_NO) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3461 char_offset += finish_composition (charbuf, cmp_status); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3462 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3463
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
3464 /* Handle composition start sequence ESC 0, ESC 2, ESC 3, or ESC 4.
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3465
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
3466 ESC 0 : relative composition : ESC 0 CHAR ... ESC 1
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
3467 ESC 2 : rulebase composition : ESC 2 CHAR RULE CHAR RULE ... CHAR ESC 1
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3468 ESC 3 : altchar composition : ESC 3 CHAR ... ESC 0 CHAR ... ESC 1
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3469 ESC 4 : alt&rule composition : ESC 4 CHAR RULE ... CHAR ESC 0 CHAR ... ESC 1
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3470
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3471 Produce this annotation sequence now:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3472
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3473 [ -LENGTH(==-4) CODING_ANNOTATE_COMPOSITION_MASK NCHARS(==0) METHOD ]
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3474 */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3475
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3476 #define DECODE_COMPOSITION_START(c1) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3477 do { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3478 if (c1 == '0' \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3479 && ((cmp_status->state == COMPOSING_COMPONENT_CHAR \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3480 && cmp_status->method == COMPOSITION_WITH_ALTCHARS) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3481 || (cmp_status->state == COMPOSING_COMPONENT_RULE \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3482 && cmp_status->method == COMPOSITION_WITH_RULE_ALTCHARS))) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3483 { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3484 *charbuf++ = -1; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3485 *charbuf++= -1; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3486 cmp_status->state = COMPOSING_CHAR; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3487 cmp_status->length += 2; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3488 } \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3489 else \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3490 { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3491 MAYBE_FINISH_COMPOSITION (); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3492 cmp_status->method = (c1 == '0' ? COMPOSITION_RELATIVE \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3493 : c1 == '2' ? COMPOSITION_WITH_RULE \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3494 : c1 == '3' ? COMPOSITION_WITH_ALTCHARS \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3495 : COMPOSITION_WITH_RULE_ALTCHARS); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3496 cmp_status->state \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3497 = (c1 <= '2' ? COMPOSING_CHAR : COMPOSING_COMPONENT_CHAR); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3498 ADD_COMPOSITION_DATA (charbuf, 0, 0, cmp_status->method); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3499 cmp_status->length = MAX_ANNOTATION_LENGTH; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3500 cmp_status->nchars = cmp_status->ncomps = 0; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3501 coding->annotated = 1; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3502 } \
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3503 } while (0)
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3504
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3505
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3506 /* Handle composition end sequence ESC 1. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3507
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3508 #define DECODE_COMPOSITION_END() \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3509 do { \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3510 if (cmp_status->nchars == 0 \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3511 || ((cmp_status->state == COMPOSING_CHAR) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3512 == (cmp_status->method == COMPOSITION_WITH_RULE))) \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3513 { \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3514 MAYBE_FINISH_COMPOSITION (); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3515 goto invalid_code; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3516 } \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3517 if (cmp_status->method == COMPOSITION_WITH_ALTCHARS) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3518 charbuf[- cmp_status->length] -= cmp_status->ncomps + 2; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3519 else if (cmp_status->method == COMPOSITION_WITH_RULE_ALTCHARS) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3520 charbuf[- cmp_status->length] -= cmp_status->ncomps * 3; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3521 charbuf[- cmp_status->length + 2] = cmp_status->nchars; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3522 char_offset += cmp_status->nchars; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3523 cmp_status->state = COMPOSING_NO; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3524 } while (0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3525
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3526 /* Store a composition rule RULE in charbuf, and update cmp_status. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3527
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3528 #define STORE_COMPOSITION_RULE(rule) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3529 do { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3530 *charbuf++ = -2; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3531 *charbuf++ = rule; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3532 cmp_status->length += 2; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3533 cmp_status->state--; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3534 } while (0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3535
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3536 /* Store a composed char or a component char C in charbuf, and update
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3537 cmp_status. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3538
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3539 #define STORE_COMPOSITION_CHAR(c) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3540 do { \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3541 *charbuf++ = (c); \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3542 cmp_status->length++; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3543 if (cmp_status->state == COMPOSING_CHAR) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3544 cmp_status->nchars++; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3545 else \
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3546 cmp_status->ncomps++; \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3547 if (cmp_status->method == COMPOSITION_WITH_RULE \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3548 || (cmp_status->method == COMPOSITION_WITH_RULE_ALTCHARS \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3549 && cmp_status->state == COMPOSING_COMPONENT_CHAR)) \
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3550 cmp_status->state++; \
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3551 } while (0)
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3552
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3553
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3554 /* See the above "GENERAL NOTES on `decode_coding_XXX ()' functions". */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3555
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3556 static void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3557 decode_coding_iso_2022 (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3558 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3559 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3560 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3561 const unsigned char *src_end = coding->source + coding->src_bytes;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
3562 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
3563 int *charbuf = coding->charbuf + coding->charbuf_used;
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
3564 /* We may produce two annocations (charset and composition) in one
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
3565 loop and one more charset annocation at the end. */
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3566 int *charbuf_end
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
3567 = coding->charbuf + coding->charbuf_size - (MAX_ANNOTATION_LENGTH * 3);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3568 int consumed_chars = 0, consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3569 int multibytep = coding->src_multibyte;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3570 /* Charsets invoked to graphic plane 0 and 1 respectively. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3571 int charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3572 int charset_id_1 = CODING_ISO_INVOKED_CHARSET (coding, 1);
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3573 int charset_id_2, charset_id_3;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3574 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3575 int c;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3576 struct composition_status *cmp_status = CODING_ISO_CMP_STATUS (coding);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
3577 Lisp_Object attrs, charset_list;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3578 int char_offset = coding->produced_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3579 int last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3580 int last_id = charset_ascii;
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
3581 int eol_crlf =
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
3582 !inhibit_eol_conversion && EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3583 int byte_after_cr = -1;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3584 int i;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3585
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
3586 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3587 setup_iso_safe_charsets (attrs);
90772
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
3588 /* Charset list may have been changed. */
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
3589 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
3590 coding->safe_charsets = SDATA (CODING_ATTR_SAFE_CHARSETS (attrs));
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3591
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3592 if (cmp_status->state != COMPOSING_NO)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3593 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3594 for (i = 0; i < cmp_status->length; i++)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3595 *charbuf++ = cmp_status->carryover[i];
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3596 coding->annotated = 1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3597 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3598
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3599 while (1)
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3600 {
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3601 int c1, c2;
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3602
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3603 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3604 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3605
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3606 if (charbuf >= charbuf_end)
100936
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
3607 {
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
3608 if (byte_after_cr >= 0)
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
3609 src_base--;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
3610 break;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
3611 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3612
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3613 if (byte_after_cr >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3614 c1 = byte_after_cr, byte_after_cr = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3615 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3616 ONE_MORE_BYTE (c1);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
3617 if (c1 < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
3618 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3619
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3620 if (CODING_ISO_EXTSEGMENT_LEN (coding) > 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3621 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3622 *charbuf++ = ASCII_BYTE_P (c1) ? c1 : BYTE8_TO_CHAR (c1);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3623 char_offset++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3624 CODING_ISO_EXTSEGMENT_LEN (coding)--;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3625 continue;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3626 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3627
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3628 if (CODING_ISO_EMBEDDED_UTF_8 (coding))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3629 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3630 if (c1 == ISO_CODE_ESC)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3631 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3632 if (src + 1 >= src_end)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3633 goto no_more_source;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3634 *charbuf++ = ISO_CODE_ESC;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3635 char_offset++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3636 if (src[0] == '%' && src[1] == '@')
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3637 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3638 src += 2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3639 consumed_chars += 2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3640 char_offset += 2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3641 /* We are sure charbuf can contain two more chars. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3642 *charbuf++ = '%';
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3643 *charbuf++ = '@';
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3644 CODING_ISO_EMBEDDED_UTF_8 (coding) = 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3645 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3646 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3647 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3648 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3649 *charbuf++ = ASCII_BYTE_P (c1) ? c1 : BYTE8_TO_CHAR (c1);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3650 char_offset++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3651 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3652 continue;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3653 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3654
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3655 if ((cmp_status->state == COMPOSING_RULE
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3656 || cmp_status->state == COMPOSING_COMPONENT_RULE)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3657 && c1 != ISO_CODE_ESC)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3658 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3659 int rule, nbytes;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3660
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3661 DECODE_COMPOSITION_RULE (rule, nbytes);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3662 if (rule < 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3663 goto invalid_code;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3664 STORE_COMPOSITION_RULE (rule);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3665 continue;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3666 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3667
89279
1fd77c471ee6 (decode_coding_utf_8): When eol_type is Qdos, handle
Kenichi Handa <handa@m17n.org>
parents: 89227
diff changeset
3668 /* We produce at most one character. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3669 switch (iso_code_class [c1])
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3670 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3671 case ISO_0x20_or_0x7F:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3672 if (charset_id_0 < 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3673 || ! CHARSET_ISO_CHARS_96 (CHARSET_FROM_ID (charset_id_0)))
88585
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3674 /* This is SPACE or DEL. */
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3675 charset = CHARSET_FROM_ID (charset_ascii);
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3676 else
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3677 charset = CHARSET_FROM_ID (charset_id_0);
c7772f702227 (ONE_MORE_BYTE_NO_CHECK): Increment consumed_chars.
Kenichi Handa <handa@m17n.org>
parents: 88573
diff changeset
3678 break;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3679
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3680 case ISO_graphic_plane_0:
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3681 if (charset_id_0 < 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3682 charset = CHARSET_FROM_ID (charset_ascii);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3683 else
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3684 charset = CHARSET_FROM_ID (charset_id_0);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3685 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3686
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3687 case ISO_0xA0_or_0xFF:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3688 if (charset_id_1 < 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3689 || ! CHARSET_ISO_CHARS_96 (CHARSET_FROM_ID (charset_id_1))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3690 || CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3691 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3692 /* This is a graphic character, we fall down ... */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3693
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3694 case ISO_graphic_plane_1:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3695 if (charset_id_1 < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3696 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3697 charset = CHARSET_FROM_ID (charset_id_1);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3698 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3699
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3700 case ISO_control_0:
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3701 if (eol_crlf && c1 == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
3702 ONE_MORE_BYTE (byte_after_cr);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3703 MAYBE_FINISH_COMPOSITION ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3704 charset = CHARSET_FROM_ID (charset_ascii);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3705 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3706
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3707 case ISO_control_1:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3708 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3709
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3710 case ISO_shift_out:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3711 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_LOCKING_SHIFT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3712 || CODING_ISO_DESIGNATION (coding, 1) < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3713 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3714 CODING_ISO_INVOCATION (coding, 0) = 1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3715 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3716 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3717
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3718 case ISO_shift_in:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3719 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_LOCKING_SHIFT))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3720 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3721 CODING_ISO_INVOCATION (coding, 0) = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3722 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3723 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3724
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3725 case ISO_single_shift_2_7:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3726 case ISO_single_shift_2:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3727 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3728 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3729 /* SS2 is handled as an escape sequence of ESC 'N' */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3730 c1 = 'N';
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3731 goto label_escape_sequence;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3732
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3733 case ISO_single_shift_3:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3734 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3735 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3736 /* SS2 is handled as an escape sequence of ESC 'O' */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3737 c1 = 'O';
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3738 goto label_escape_sequence;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3739
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3740 case ISO_control_sequence_introducer:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3741 /* CSI is handled as an escape sequence of ESC '[' ... */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3742 c1 = '[';
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3743 goto label_escape_sequence;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3744
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3745 case ISO_escape:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3746 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3747 label_escape_sequence:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3748 /* Escape sequences handled here are invocation,
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3749 designation, direction specification, and character
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3750 composition specification. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3751 switch (c1)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3752 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3753 case '&': /* revision of following character set */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3754 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3755 if (!(c1 >= '@' && c1 <= '~'))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3756 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3757 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3758 if (c1 != ISO_CODE_ESC)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3759 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3760 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3761 goto label_escape_sequence;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3762
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3763 case '$': /* designation of 2-byte character set */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3764 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_DESIGNATION))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3765 goto invalid_code;
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3766 {
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3767 int reg, chars96;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3768
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3769 ONE_MORE_BYTE (c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3770 if (c1 >= '@' && c1 <= 'B')
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3771 { /* designation of JISX0208.1978, GB2312.1980,
23339
2da87b489590 (check_composing_code): Fix previous change. Now it
Kenichi Handa <handa@m17n.org>
parents: 23325
diff changeset
3772 or JISX0208.1980 */
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3773 reg = 0, chars96 = 0;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3774 }
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3775 else if (c1 >= 0x28 && c1 <= 0x2B)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3776 { /* designation of DIMENSION2_CHARS94 character set */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3777 reg = c1 - 0x28, chars96 = 0;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3778 ONE_MORE_BYTE (c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3779 }
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3780 else if (c1 >= 0x2C && c1 <= 0x2F)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3781 { /* designation of DIMENSION2_CHARS96 character set */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3782 reg = c1 - 0x2C, chars96 = 1;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3783 ONE_MORE_BYTE (c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3784 }
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3785 else
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3786 goto invalid_code;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3787 DECODE_DESIGNATION (reg, 2, chars96, c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3788 /* We must update these variables now. */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3789 if (reg == 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3790 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3791 else if (reg == 1)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3792 charset_id_1 = CODING_ISO_INVOKED_CHARSET (coding, 1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3793 if (chars96 < 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3794 goto invalid_code;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3795 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3796 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3797
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3798 case 'n': /* invocation of locking-shift-2 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3799 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_LOCKING_SHIFT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3800 || CODING_ISO_DESIGNATION (coding, 2) < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3801 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3802 CODING_ISO_INVOCATION (coding, 0) = 2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3803 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3804 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3805
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3806 case 'o': /* invocation of locking-shift-3 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3807 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_LOCKING_SHIFT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3808 || CODING_ISO_DESIGNATION (coding, 3) < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3809 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3810 CODING_ISO_INVOCATION (coding, 0) = 3;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3811 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3812 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3813
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3814 case 'N': /* invocation of single-shift-2 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3815 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3816 || CODING_ISO_DESIGNATION (coding, 2) < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3817 goto invalid_code;
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3818 charset_id_2 = CODING_ISO_DESIGNATION (coding, 2);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3819 if (charset_id_2 < 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3820 charset = CHARSET_FROM_ID (charset_ascii);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3821 else
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3822 charset = CHARSET_FROM_ID (charset_id_2);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3823 ONE_MORE_BYTE (c1);
30578
705b94e152b1 (decode_coding_iso2022): More strict check for handling single
Kenichi Handa <handa@m17n.org>
parents: 30487
diff changeset
3824 if (c1 < 0x20 || (c1 >= 0x80 && c1 < 0xA0))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3825 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3826 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3827
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3828 case 'O': /* invocation of single-shift-3 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3829 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3830 || CODING_ISO_DESIGNATION (coding, 3) < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3831 goto invalid_code;
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3832 charset_id_3 = CODING_ISO_DESIGNATION (coding, 3);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3833 if (charset_id_3 < 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3834 charset = CHARSET_FROM_ID (charset_ascii);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3835 else
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3836 charset = CHARSET_FROM_ID (charset_id_3);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3837 ONE_MORE_BYTE (c1);
30578
705b94e152b1 (decode_coding_iso2022): More strict check for handling single
Kenichi Handa <handa@m17n.org>
parents: 30487
diff changeset
3838 if (c1 < 0x20 || (c1 >= 0x80 && c1 < 0xA0))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3839 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3840 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3841
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3842 case '0': case '2': case '3': case '4': /* start composition */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3843 if (! (coding->common_flags & CODING_ANNOTATE_COMPOSITION_MASK))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3844 goto invalid_code;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3845 if (last_id != charset_ascii)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3846 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3847 ADD_CHARSET_DATA (charbuf, char_offset- last_offset, last_id);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3848 last_id = charset_ascii;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3849 last_offset = char_offset;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3850 }
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3851 DECODE_COMPOSITION_START (c1);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3852 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3853
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
3854 case '1': /* end composition */
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3855 if (cmp_status->state == COMPOSING_NO)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3856 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3857 DECODE_COMPOSITION_END ();
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3858 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3859
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3860 case '[': /* specification of direction */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3861 if (! CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_DIRECTION)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3862 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3863 /* For the moment, nested direction is not supported.
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3864 So, `coding->mode & CODING_MODE_DIRECTION' zero means
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3865 left-to-right, and nozero means right-to-left. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3866 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3867 switch (c1)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3868 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3869 case ']': /* end of the current direction */
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3870 coding->mode &= ~CODING_MODE_DIRECTION;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3871
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3872 case '0': /* end of the current direction */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3873 case '1': /* start of left-to-right direction */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3874 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3875 if (c1 == ']')
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3876 coding->mode &= ~CODING_MODE_DIRECTION;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3877 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3878 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3879 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3880
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3881 case '2': /* start of right-to-left direction */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3882 ONE_MORE_BYTE (c1);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3883 if (c1 == ']')
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
3884 coding->mode |= CODING_MODE_DIRECTION;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3885 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3886 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3887 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3888
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3889 default:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3890 goto invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3891 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3892 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3893
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3894 case '%':
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3895 ONE_MORE_BYTE (c1);
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3896 if (c1 == '/')
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3897 {
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3898 /* CTEXT extended segment:
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3899 ESC % / [0-4] M L --ENCODING-NAME-- \002 --BYTES--
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3900 We keep these bytes as is for the moment.
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3901 They may be decoded by post-read-conversion. */
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3902 int dim, M, L;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3903 int size;
56191
75f56340b4f9 (MAX_ALLOCA): Remove define.
Kim F. Storm <storm@cua.dk>
parents: 56028
diff changeset
3904
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3905 ONE_MORE_BYTE (dim);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3906 if (dim < 0 || dim > 4)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3907 goto invalid_code;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3908 ONE_MORE_BYTE (M);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3909 if (M < 128)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3910 goto invalid_code;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3911 ONE_MORE_BYTE (L);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3912 if (L < 128)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3913 goto invalid_code;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3914 size = ((M - 128) * 128) + (L - 128);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3915 if (charbuf + 6 > charbuf_end)
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3916 goto break_loop;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3917 *charbuf++ = ISO_CODE_ESC;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3918 *charbuf++ = '%';
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3919 *charbuf++ = '/';
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3920 *charbuf++ = dim;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3921 *charbuf++ = BYTE8_TO_CHAR (M);
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3922 *charbuf++ = BYTE8_TO_CHAR (L);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3923 CODING_ISO_EXTSEGMENT_LEN (coding) = size;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3924 }
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3925 else if (c1 == 'G')
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3926 {
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3927 /* XFree86 extension for embedding UTF-8 in CTEXT:
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3928 ESC % G --UTF-8-BYTES-- ESC % @
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3929 We keep these bytes as is for the moment.
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3930 They may be decoded by post-read-conversion. */
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3931 if (charbuf + 3 > charbuf_end)
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3932 goto break_loop;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3933 *charbuf++ = ISO_CODE_ESC;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3934 *charbuf++ = '%';
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3935 *charbuf++ = 'G';
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3936 CODING_ISO_EMBEDDED_UTF_8 (coding) = 1;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3937 }
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3938 else
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3939 goto invalid_code;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3940 continue;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
3941 break;
51311
e723bcb43569 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 51231
diff changeset
3942
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3943 default:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3944 if (! (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_DESIGNATION))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3945 goto invalid_code;
89873
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3946 {
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3947 int reg, chars96;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3948
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3949 if (c1 >= 0x28 && c1 <= 0x2B)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3950 { /* designation of DIMENSION1_CHARS94 character set */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3951 reg = c1 - 0x28, chars96 = 0;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3952 ONE_MORE_BYTE (c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3953 }
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3954 else if (c1 >= 0x2C && c1 <= 0x2F)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3955 { /* designation of DIMENSION1_CHARS96 character set */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3956 reg = c1 - 0x2C, chars96 = 1;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3957 ONE_MORE_BYTE (c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3958 }
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3959 else
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3960 goto invalid_code;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3961 DECODE_DESIGNATION (reg, 1, chars96, c1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3962 /* We must update these variables now. */
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3963 if (reg == 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3964 charset_id_0 = CODING_ISO_INVOKED_CHARSET (coding, 0);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3965 else if (reg == 1)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3966 charset_id_1 = CODING_ISO_INVOKED_CHARSET (coding, 1);
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3967 if (chars96 < 0)
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3968 goto invalid_code;
9a279ff9d245 (DECODE_DESIGNATION): Set chars_96 to -1 instead of
Kenichi Handa <handa@m17n.org>
parents: 89863
diff changeset
3969 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3970 continue;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
3971 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3972 }
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3973
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3974 if (cmp_status->state == COMPOSING_NO
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
3975 && charset->id != charset_ascii
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3976 && last_id != charset->id)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3977 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3978 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
3979 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3980 last_id = charset->id;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3981 last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3982 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
3983
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3984 /* Now we know CHARSET and 1st position code C1 of a character.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3985 Produce a decoded character while getting 2nd position code
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3986 C2 if necessary. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3987 c1 &= 0x7F;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3988 if (CHARSET_DIMENSION (charset) > 1)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3989 {
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3990 ONE_MORE_BYTE (c2);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3991 if (c2 < 0x20 || (c2 >= 0x80 && c2 < 0xA0))
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
3992 /* C2 is not in a valid range. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3993 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3994 c1 = (c1 << 8) | (c2 & 0x7F);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3995 if (CHARSET_DIMENSION (charset) > 2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3996 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3997 ONE_MORE_BYTE (c2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3998 if (c2 < 0x20 || (c2 >= 0x80 && c2 < 0xA0))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
3999 /* C2 is not in a valid range. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4000 goto invalid_code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4001 c1 = (c1 << 8) | (c2 & 0x7F);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4002 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4003 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4004
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4005 CODING_DECODE_CHAR (coding, src, src_base, src_end, charset, c1, c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4006 if (c < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4007 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4008 MAYBE_FINISH_COMPOSITION ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4009 for (; src_base < src; src_base++, char_offset++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4010 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4011 if (ASCII_BYTE_P (*src_base))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4012 *charbuf++ = *src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4013 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4014 *charbuf++ = BYTE8_TO_CHAR (*src_base);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4015 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4016 }
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4017 else if (cmp_status->state == COMPOSING_NO)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4018 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4019 *charbuf++ = c;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4020 char_offset++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4021 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4022 else if ((cmp_status->state == COMPOSING_CHAR
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4023 ? cmp_status->nchars
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4024 : cmp_status->ncomps)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4025 >= MAX_COMPOSITION_COMPONENTS)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4026 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4027 /* Too long composition. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4028 MAYBE_FINISH_COMPOSITION ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4029 *charbuf++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4030 char_offset++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4031 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4032 else
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4033 STORE_COMPOSITION_CHAR (c);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4034 continue;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4035
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4036 invalid_code:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4037 MAYBE_FINISH_COMPOSITION ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4038 src = src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4039 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4040 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4041 *charbuf++ = c < 0 ? -c : ASCII_BYTE_P (c) ? c : BYTE8_TO_CHAR (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4042 char_offset++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4043 coding->errors++;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
4044 continue;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
4045
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
4046 break_loop:
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
4047 break;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4048 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4049
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4050 no_more_source:
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4051 if (cmp_status->state != COMPOSING_NO)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4052 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4053 if (coding->mode & CODING_MODE_LAST_BLOCK)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4054 MAYBE_FINISH_COMPOSITION ();
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4055 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4056 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4057 charbuf -= cmp_status->length;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4058 for (i = 0; i < cmp_status->length; i++)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4059 cmp_status->carryover[i] = charbuf[i];
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4060 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4061 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
4062 else if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4063 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4064 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4065 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4066 coding->charbuf_used = charbuf - coding->charbuf;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4067 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4068
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4069
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
4070 /* ISO2022 encoding stuff. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4071
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4072 /*
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
4073 It is not enough to say just "ISO2022" on encoding, we have to
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4074 specify more details. In Emacs, each coding system of ISO2022
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4075 variant has the following specifications:
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4076 1. Initial designation to G0 thru G3.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4077 2. Allows short-form designation?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4078 3. ASCII should be designated to G0 before control characters?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4079 4. ASCII should be designated to G0 at end of line?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4080 5. 7-bit environment or 8-bit environment?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4081 6. Use locking-shift?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4082 7. Use Single-shift?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4083 And the following two are only for Japanese:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4084 8. Use ASCII in place of JIS0201-1976-Roman?
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4085 9. Use JISX0208-1983 in place of JISX0208-1978?
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4086 These specifications are encoded in CODING_ISO_FLAGS (coding) as flag bits
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4087 defined by macros CODING_ISO_FLAG_XXX. See `coding.h' for more
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
4088 details.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4089 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4090
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4091 /* Produce codes (escape sequence) for designating CHARSET to graphic
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4092 register REG at DST, and increment DST. If <final-char> of CHARSET is
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4093 '@', 'A', or 'B' and the coding system CODING allows, produce
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4094 designation sequence of short-form. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4095
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4096 #define ENCODE_DESIGNATION(charset, reg, coding) \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4097 do { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4098 unsigned char final_char = CHARSET_ISO_FINAL (charset); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4099 char *intermediate_char_94 = "()*+"; \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4100 char *intermediate_char_96 = ",-./"; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4101 int revision = -1; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4102 int c; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4103 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4104 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_REVISION) \
88856
13a375bc220d (ENCODE_DESIGNATION, decode_eol)
Dave Love <fx@gnu.org>
parents: 88845
diff changeset
4105 revision = CHARSET_ISO_REVISION (charset); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4106 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4107 if (revision >= 0) \
20150
402b6e5f4b58 (encode_designation_at_bol): Fix bug of finding graphic
Kenichi Handa <handa@m17n.org>
parents: 20105
diff changeset
4108 { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4109 EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, '&'); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4110 EMIT_ONE_BYTE ('@' + revision); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4111 } \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4112 EMIT_ONE_ASCII_BYTE (ISO_CODE_ESC); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4113 if (CHARSET_DIMENSION (charset) == 1) \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4114 { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4115 if (! CHARSET_ISO_CHARS_96 (charset)) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4116 c = intermediate_char_94[reg]; \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4117 else \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4118 c = intermediate_char_96[reg]; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4119 EMIT_ONE_ASCII_BYTE (c); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4120 } \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4121 else \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4122 { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4123 EMIT_ONE_ASCII_BYTE ('$'); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4124 if (! CHARSET_ISO_CHARS_96 (charset)) \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4125 { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4126 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_LONG_FORM \
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4127 || reg != 0 \
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4128 || final_char < '@' || final_char > 'B') \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4129 EMIT_ONE_ASCII_BYTE (intermediate_char_94[reg]); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4130 } \
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4131 else \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4132 EMIT_ONE_ASCII_BYTE (intermediate_char_96[reg]); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4133 } \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4134 EMIT_ONE_ASCII_BYTE (final_char); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4135 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4136 CODING_ISO_DESIGNATION (coding, reg) = CHARSET_ID (charset); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4137 } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4138
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4139
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4140 /* The following two macros produce codes (control character or escape
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4141 sequence) for ISO2022 single-shift functions (single-shift-2 and
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4142 single-shift-3). */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4143
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4144 #define ENCODE_SINGLE_SHIFT_2 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4145 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4146 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4147 EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, 'N'); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4148 else \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4149 EMIT_ONE_BYTE (ISO_CODE_SS2); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4150 CODING_ISO_SINGLE_SHIFTING (coding) = 1; \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4151 } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4152
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4153
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4154 #define ENCODE_SINGLE_SHIFT_3 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4155 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4156 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4157 EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, 'O'); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4158 else \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4159 EMIT_ONE_BYTE (ISO_CODE_SS3); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4160 CODING_ISO_SINGLE_SHIFTING (coding) = 1; \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4161 } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4162
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4163
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4164 /* The following four macros produce codes (control character or
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4165 escape sequence) for ISO2022 locking-shift functions (shift-in,
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4166 shift-out, locking-shift-2, and locking-shift-3). */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4167
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4168 #define ENCODE_SHIFT_IN \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4169 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4170 EMIT_ONE_ASCII_BYTE (ISO_CODE_SI); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4171 CODING_ISO_INVOCATION (coding, 0) = 0; \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4172 } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4173
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4174
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4175 #define ENCODE_SHIFT_OUT \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4176 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4177 EMIT_ONE_ASCII_BYTE (ISO_CODE_SO); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4178 CODING_ISO_INVOCATION (coding, 0) = 1; \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4179 } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4180
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4181
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4182 #define ENCODE_LOCKING_SHIFT_2 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4183 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4184 EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, 'n'); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4185 CODING_ISO_INVOCATION (coding, 0) = 2; \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4186 } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4187
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4188
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4189 #define ENCODE_LOCKING_SHIFT_3 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4190 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4191 EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, 'n'); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4192 CODING_ISO_INVOCATION (coding, 0) = 3; \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4193 } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4194
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4195
18766
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
4196 /* Produce codes for a DIMENSION1 character whose character set is
ac2e7e21abb0 Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18747
diff changeset
4197 CHARSET and whose position-code is C1. Designation and invocation
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4198 sequences are also produced in advance if necessary. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4199
19285
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4200 #define ENCODE_ISO_CHARACTER_DIMENSION1(charset, c1) \
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4201 do { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4202 int id = CHARSET_ID (charset); \
88681
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4203 \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4204 if ((CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_USE_ROMAN) \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4205 && id == charset_ascii) \
19285
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4206 { \
88681
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4207 id = charset_jisx0201_roman; \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4208 charset = CHARSET_FROM_ID (id); \
19285
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4209 } \
88681
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4210 \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4211 if (CODING_ISO_SINGLE_SHIFTING (coding)) \
19285
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4212 { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4213 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4214 EMIT_ONE_ASCII_BYTE (c1 & 0x7F); \
19285
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4215 else \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4216 EMIT_ONE_BYTE (c1 | 0x80); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4217 CODING_ISO_SINGLE_SHIFTING (coding) = 0; \
19285
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4218 break; \
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4219 } \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4220 else if (id == CODING_ISO_INVOKED_CHARSET (coding, 0)) \
19285
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4221 { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4222 EMIT_ONE_ASCII_BYTE (c1 & 0x7F); \
19285
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4223 break; \
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4224 } \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4225 else if (id == CODING_ISO_INVOKED_CHARSET (coding, 1)) \
19285
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4226 { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4227 EMIT_ONE_BYTE (c1 | 0x80); \
19285
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4228 break; \
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4229 } \
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4230 else \
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4231 /* Since CHARSET is not yet invoked to any graphic planes, we \
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4232 must invoke it, or, at first, designate it to some graphic \
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4233 register. Then repeat the loop to actually produce the \
af3d00fde172 (Fset_terminal_coding_system_internal): Set
Kenichi Handa <handa@m17n.org>
parents: 19280
diff changeset
4234 character. */ \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4235 dst = encode_invocation_designation (charset, coding, dst, \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4236 &produced_chars); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4237 } while (1)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4238
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4239
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4240 /* Produce codes for a DIMENSION2 character whose character set is
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4241 CHARSET and whose position-codes are C1 and C2. Designation and
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4242 invocation codes are also produced in advance if necessary. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4243
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4244 #define ENCODE_ISO_CHARACTER_DIMENSION2(charset, c1, c2) \
24506
219c99669e4b (ENCODE_ISO_CHARACTER): Check validity of CHARSET. If
Kenichi Handa <handa@m17n.org>
parents: 24460
diff changeset
4245 do { \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4246 int id = CHARSET_ID (charset); \
88681
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4247 \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4248 if ((CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_USE_OLDJIS) \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4249 && id == charset_jisx0208) \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4250 { \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4251 id = charset_jisx0208_1978; \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4252 charset = CHARSET_FROM_ID (id); \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4253 } \
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4254 \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4255 if (CODING_ISO_SINGLE_SHIFTING (coding)) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4256 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4257 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SEVEN_BITS) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4258 EMIT_TWO_ASCII_BYTES ((c1) & 0x7F, (c2) & 0x7F); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4259 else \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4260 EMIT_TWO_BYTES ((c1) | 0x80, (c2) | 0x80); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4261 CODING_ISO_SINGLE_SHIFTING (coding) = 0; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4262 break; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4263 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4264 else if (id == CODING_ISO_INVOKED_CHARSET (coding, 0)) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4265 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4266 EMIT_TWO_ASCII_BYTES ((c1) & 0x7F, (c2) & 0x7F); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4267 break; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4268 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4269 else if (id == CODING_ISO_INVOKED_CHARSET (coding, 1)) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4270 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4271 EMIT_TWO_BYTES ((c1) | 0x80, (c2) | 0x80); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4272 break; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4273 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4274 else \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4275 /* Since CHARSET is not yet invoked to any graphic planes, we \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4276 must invoke it, or, at first, designate it to some graphic \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4277 register. Then repeat the loop to actually produce the \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4278 character. */ \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4279 dst = encode_invocation_designation (charset, coding, dst, \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4280 &produced_chars); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4281 } while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4282
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4283
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4284 #define ENCODE_ISO_CHARACTER(charset, c) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4285 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4286 int code = ENCODE_CHAR ((charset),(c)); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4287 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4288 if (CHARSET_DIMENSION (charset) == 1) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4289 ENCODE_ISO_CHARACTER_DIMENSION1 ((charset), code); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4290 else \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4291 ENCODE_ISO_CHARACTER_DIMENSION2 ((charset), code >> 8, code & 0xFF); \
22119
592bb8b9bcfd Change terms unify/unification to
Kenichi Handa <handa@m17n.org>
parents: 22020
diff changeset
4292 } while (0)
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4293
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
4294
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4295 /* Produce designation and invocation codes at a place pointed by DST
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4296 to use CHARSET. The element `spec.iso_2022' of *CODING is updated.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4297 Return new DST. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4298
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4299 unsigned char *
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4300 encode_invocation_designation (charset, coding, dst, p_nchars)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4301 struct charset *charset;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4302 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4303 unsigned char *dst;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4304 int *p_nchars;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4305 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4306 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4307 int produced_chars = *p_nchars;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4308 int reg; /* graphic register number */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4309 int id = CHARSET_ID (charset);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4310
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4311 /* At first, check designations. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4312 for (reg = 0; reg < 4; reg++)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4313 if (id == CODING_ISO_DESIGNATION (coding, reg))
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4314 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4315
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4316 if (reg >= 4)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4317 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4318 /* CHARSET is not yet designated to any graphic registers. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4319 /* At first check the requested designation. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4320 reg = CODING_ISO_REQUEST (coding, id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4321 if (reg < 0)
18002
a14261786239 (encode_invocation_designation): Use macro
Kenichi Handa <handa@m17n.org>
parents: 17835
diff changeset
4322 /* Since CHARSET requests no special designation, designate it
a14261786239 (encode_invocation_designation): Use macro
Kenichi Handa <handa@m17n.org>
parents: 17835
diff changeset
4323 to graphic register 0. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4324 reg = 0;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4325
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4326 ENCODE_DESIGNATION (charset, reg, coding);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4327 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4328
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4329 if (CODING_ISO_INVOCATION (coding, 0) != reg
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4330 && CODING_ISO_INVOCATION (coding, 1) != reg)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4331 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4332 /* Since the graphic register REG is not invoked to any graphic
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4333 planes, invoke it to graphic plane 0. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4334 switch (reg)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4335 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4336 case 0: /* graphic register 0 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4337 ENCODE_SHIFT_IN;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4338 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4339
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4340 case 1: /* graphic register 1 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4341 ENCODE_SHIFT_OUT;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4342 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4343
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4344 case 2: /* graphic register 2 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4345 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4346 ENCODE_SINGLE_SHIFT_2;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4347 else
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4348 ENCODE_LOCKING_SHIFT_2;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4349 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4350
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4351 case 3: /* graphic register 3 */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4352 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_SINGLE_SHIFT)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4353 ENCODE_SINGLE_SHIFT_3;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4354 else
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4355 ENCODE_LOCKING_SHIFT_3;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4356 break;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4357 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4358 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4359
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4360 *p_nchars = produced_chars;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4361 return dst;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4362 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4363
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4364 /* The following three macros produce codes for indicating direction
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4365 of text. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4366 #define ENCODE_CONTROL_SEQUENCE_INTRODUCER \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4367 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4368 if (CODING_ISO_FLAGS (coding) == CODING_ISO_FLAG_SEVEN_BITS) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4369 EMIT_TWO_ASCII_BYTES (ISO_CODE_ESC, '['); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4370 else \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4371 EMIT_ONE_BYTE (ISO_CODE_CSI); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4372 } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4373
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4374
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4375 #define ENCODE_DIRECTION_R2L() \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4376 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4377 ENCODE_CONTROL_SEQUENCE_INTRODUCER (dst); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4378 EMIT_TWO_ASCII_BYTES ('2', ']'); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4379 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4380
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4381
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4382 #define ENCODE_DIRECTION_L2R() \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4383 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4384 ENCODE_CONTROL_SEQUENCE_INTRODUCER (dst); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4385 EMIT_TWO_ASCII_BYTES ('0', ']'); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4386 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4387
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4388
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4389 /* Produce codes for designation and invocation to reset the graphic
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4390 planes and registers to initial state. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4391 #define ENCODE_RESET_PLANE_AND_REGISTER() \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4392 do { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4393 int reg; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4394 struct charset *charset; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4395 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4396 if (CODING_ISO_INVOCATION (coding, 0) != 0) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4397 ENCODE_SHIFT_IN; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4398 for (reg = 0; reg < 4; reg++) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4399 if (CODING_ISO_INITIAL (coding, reg) >= 0 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4400 && (CODING_ISO_DESIGNATION (coding, reg) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4401 != CODING_ISO_INITIAL (coding, reg))) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4402 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4403 charset = CHARSET_FROM_ID (CODING_ISO_INITIAL (coding, reg)); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4404 ENCODE_DESIGNATION (charset, reg, coding); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4405 } \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4406 } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4407
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4408
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4409 /* Produce designation sequences of charsets in the line started from
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4410 SRC to a place pointed by DST, and return updated DST.
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4411
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4412 If the current block ends before any end-of-line, we may fail to
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
4413 find all the necessary designations. */
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
4414
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4415 static unsigned char *
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4416 encode_designation_at_bol (coding, charbuf, charbuf_end, dst)
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4417 struct coding_system *coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4418 int *charbuf, *charbuf_end;
59168
0345f2b10f1d (decode_coding_XXX, decode_composition_emacs_mule)
Dan Nicolaescu <dann@ics.uci.edu>
parents: 59095
diff changeset
4419 unsigned char *dst;
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4420 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4421 struct charset *charset;
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4422 /* Table of charsets to be designated to each graphic register. */
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4423 int r[4];
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4424 int c, found = 0, reg;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4425 int produced_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4426 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4427 Lisp_Object attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4428 Lisp_Object charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4429
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4430 attrs = CODING_ID_ATTRS (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4431 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4432 if (EQ (charset_list, Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4433 charset_list = Viso_2022_charset_list;
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4434
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4435 for (reg = 0; reg < 4; reg++)
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4436 r[reg] = -1;
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4437
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4438 while (found < 4)
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4439 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4440 int id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4441
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4442 c = *charbuf++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4443 if (c == '\n')
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4444 break;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4445 charset = char_charset (c, charset_list, NULL);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4446 id = CHARSET_ID (charset);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4447 reg = CODING_ISO_REQUEST (coding, id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4448 if (reg >= 0 && r[reg] < 0)
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4449 {
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4450 found++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4451 r[reg] = id;
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4452 }
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4453 }
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4454
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4455 if (found)
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4456 {
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4457 for (reg = 0; reg < 4; reg++)
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4458 if (r[reg] >= 0
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4459 && CODING_ISO_DESIGNATION (coding, reg) != r[reg])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4460 ENCODE_DESIGNATION (CHARSET_FROM_ID (r[reg]), reg, coding);
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4461 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4462
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4463 return dst;
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4464 }
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4465
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4466 /* See the above "GENERAL NOTES on `encode_coding_XXX ()' functions". */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4467
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4468 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4469 encode_coding_iso_2022 (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4470 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4471 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4472 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4473 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4474 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4475 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4476 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4477 int safe_room = 16;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4478 int bol_designation
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4479 = (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_DESIGNATE_AT_BOL
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4480 && CODING_ISO_BOL (coding));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4481 int produced_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4482 Lisp_Object attrs, eol_type, charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4483 int ascii_compatible;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4484 int c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4485 int preferred_charset_id = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4486
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4487 CODING_GET_INFO (coding, attrs, charset_list);
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
4488 eol_type = inhibit_eol_conversion ? Qunix : CODING_ID_EOL_TYPE (coding->id);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4489 if (VECTORP (eol_type))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4490 eol_type = Qunix;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4491
88497
d2b9e0d4c2f6 (Fdecode_sjis_char): Fix typo (0x7F->0xFF). Fix the
Kenichi Handa <handa@m17n.org>
parents: 88485
diff changeset
4492 setup_iso_safe_charsets (attrs);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4493 /* Charset list may have been changed. */
90772
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
4494 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
4495 coding->safe_charsets = SDATA (CODING_ATTR_SAFE_CHARSETS (attrs));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4496
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4497 ascii_compatible = ! NILP (CODING_ATTR_ASCII_COMPAT (attrs));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4498
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4499 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4500 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4501 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4502
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4503 if (bol_designation)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4504 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4505 unsigned char *dst_prev = dst;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4506
17725
92f042f73be2 (Valternate_charset_table): The valiable deleted.
Kenichi Handa <handa@m17n.org>
parents: 17717
diff changeset
4507 /* We have to produce designation sequences if any now. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4508 dst = encode_designation_at_bol (coding, charbuf, charbuf_end, dst);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4509 bol_designation = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4510 /* We are sure that designation sequences are all ASCII bytes. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4511 produced_chars += dst - dst_prev;
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4512 }
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
4513
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4514 c = *charbuf++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4515
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4516 if (c < 0)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4517 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4518 /* Handle an annotation. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4519 switch (*charbuf)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4520 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4521 case CODING_ANNOTATE_COMPOSITION_MASK:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4522 /* Not yet implemented. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4523 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4524 case CODING_ANNOTATE_CHARSET_MASK:
90014
ade0c9a12f99 (encode_coding_iso_2022): Fix handling of charset
Kenichi Handa <handa@m17n.org>
parents: 90011
diff changeset
4525 preferred_charset_id = charbuf[2];
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4526 if (preferred_charset_id >= 0
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4527 && NILP (Fmemq (make_number (preferred_charset_id),
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4528 charset_list)))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4529 preferred_charset_id = -1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4530 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4531 default:
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4532 abort ();
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
4533 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4534 charbuf += -c - 1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4535 continue;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4536 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4537
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4538 /* Now encode the character C. */
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4539 if (c < 0x20 || c == 0x7F)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4540 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4541 if (c == '\n'
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4542 || (c == '\r' && EQ (eol_type, Qmac)))
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4543 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4544 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_RESET_AT_EOL)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4545 ENCODE_RESET_PLANE_AND_REGISTER ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4546 if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_INIT_AT_BOL)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4547 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4548 int i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4549
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4550 for (i = 0; i < 4; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4551 CODING_ISO_DESIGNATION (coding, i)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4552 = CODING_ISO_INITIAL (coding, i);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4553 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4554 bol_designation
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4555 = CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_DESIGNATE_AT_BOL;
19052
302a7b2a6948 (encode_coding_iso2022): Write out invalid multibyte
Kenichi Handa <handa@m17n.org>
parents: 18910
diff changeset
4556 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4557 else if (CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_RESET_AT_CNTL)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4558 ENCODE_RESET_PLANE_AND_REGISTER ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4559 EMIT_ONE_ASCII_BYTE (c);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4560 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4561 else if (ASCII_CHAR_P (c))
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4562 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4563 if (ascii_compatible)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4564 EMIT_ONE_ASCII_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4565 else
88681
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4566 {
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4567 struct charset *charset = CHARSET_FROM_ID (charset_ascii);
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4568 ENCODE_ISO_CHARACTER (charset, c);
2cdfbffa8a0d (CODING_ISO_FLAG_USE_ROMAN): New macro
Kenichi Handa <handa@m17n.org>
parents: 88669
diff changeset
4569 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4570 }
88690
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4571 else if (CHAR_BYTE8_P (c))
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4572 {
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4573 c = CHAR_TO_BYTE8 (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4574 EMIT_ONE_BYTE (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
4575 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4576 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4577 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4578 struct charset *charset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4579
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4580 if (preferred_charset_id >= 0)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4581 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4582 charset = CHARSET_FROM_ID (preferred_charset_id);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4583 if (! CHAR_CHARSET_P (c, charset))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4584 charset = char_charset (c, charset_list, NULL);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4585 }
42104
d69c2368e549 (DECODE_COMPOSITION_END): Fixed a typo in the last
Sam Steingold <sds@gnu.org>
parents: 42103
diff changeset
4586 else
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4587 charset = char_charset (c, charset_list, NULL);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4588 if (!charset)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4589 {
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4590 if (coding->mode & CODING_MODE_SAFE_ENCODING)
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4591 {
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4592 c = CODING_INHIBIT_CHARACTER_SUBSTITUTION;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4593 charset = CHARSET_FROM_ID (charset_ascii);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4594 }
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4595 else
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4596 {
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4597 c = coding->default_char;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4598 charset = char_charset (c, charset_list, NULL);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
4599 }
19052
302a7b2a6948 (encode_coding_iso2022): Write out invalid multibyte
Kenichi Handa <handa@m17n.org>
parents: 18910
diff changeset
4600 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4601 ENCODE_ISO_CHARACTER (charset, c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4602 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4603 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4604
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4605 if (coding->mode & CODING_MODE_LAST_BLOCK
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4606 && CODING_ISO_FLAGS (coding) & CODING_ISO_FLAG_RESET_AT_EOL)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4607 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4608 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4609 ENCODE_RESET_PLANE_AND_REGISTER ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4610 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4611 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4612 CODING_ISO_BOL (coding) = bol_designation;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4613 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4614 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4615 return 0;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4616 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4617
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4618
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4619 /*** 8,9. SJIS and BIG5 handlers ***/
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4620
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4621 /* Although SJIS and BIG5 are not ISO's coding system, they are used
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4622 quite widely. So, for the moment, Emacs supports them in the bare
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4623 C code. But, in the future, they may be supported only by CCL. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4624
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4625 /* SJIS is a coding system encoding three character sets: ASCII, right
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4626 half of JISX0201-Kana, and JISX0208. An ASCII character is encoded
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4627 as is. A character of charset katakana-jisx0201 is encoded by
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4628 "position-code + 0x80". A character of charset japanese-jisx0208
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4629 is encoded in 2-byte but two position-codes are divided and shifted
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4630 so that it fit in the range below.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4631
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4632 --- CODE RANGE of SJIS ---
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4633 (character set) (range)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4634 ASCII 0x00 .. 0x7F
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4635 KATAKANA-JISX0201 0xA0 .. 0xDF
24324
2eec590faf26 (Fdecode_sjis_char, Fencode_sjis_char): Hanlde
Kenichi Handa <handa@m17n.org>
parents: 24316
diff changeset
4636 JISX0208 (1st byte) 0x81 .. 0x9F and 0xE0 .. 0xEF
23564
6eb3e346d1fd (DECODE_CHARACTER_ASCII): Check validity of inserted
Kenichi Handa <handa@m17n.org>
parents: 23542
diff changeset
4637 (2nd byte) 0x40 .. 0x7E and 0x80 .. 0xFC
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4638 -------------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4639
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4640 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4641
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4642 /* BIG5 is a coding system encoding two character sets: ASCII and
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4643 Big5. An ASCII character is encoded as is. Big5 is a two-byte
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4644 character set and is encoded in two-byte.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4645
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4646 --- CODE RANGE of BIG5 ---
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4647 (character set) (range)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4648 ASCII 0x00 .. 0x7F
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4649 Big5 (1st byte) 0xA1 .. 0xFE
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4650 (2nd byte) 0x40 .. 0x7E and 0xA1 .. 0xFE
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4651 --------------------------
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4652
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4653 */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4654
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4655 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4656 Check if a text is encoded in SJIS. If it is, return
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4657 CATEGORY_MASK_SJIS, else return 0. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4658
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
4659 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4660 detect_coding_sjis (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4661 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4662 struct coding_detection_info *detect_info;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4663 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4664 const unsigned char *src = coding->source, *src_base;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4665 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4666 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4667 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4668 int found = 0;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4669 int c;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4670
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4671 detect_info->checked |= CATEGORY_MASK_SJIS;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4672 /* A coding system of this category is always ASCII compatible. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4673 src += coding->head_ascii;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4674
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4675 while (1)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4676 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4677 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4678 ONE_MORE_BYTE (c);
36647
0a75ccbe42b2 (detect_coding_sjis): Do more rigid check.
Kenichi Handa <handa@m17n.org>
parents: 36520
diff changeset
4679 if (c < 0x80)
0a75ccbe42b2 (detect_coding_sjis): Do more rigid check.
Kenichi Handa <handa@m17n.org>
parents: 36520
diff changeset
4680 continue;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4681 if ((c >= 0x81 && c <= 0x9F) || (c >= 0xE0 && c <= 0xEF))
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4682 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4683 ONE_MORE_BYTE (c);
36647
0a75ccbe42b2 (detect_coding_sjis): Do more rigid check.
Kenichi Handa <handa@m17n.org>
parents: 36520
diff changeset
4684 if (c < 0x40 || c == 0x7F || c > 0xFC)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4685 break;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4686 found = CATEGORY_MASK_SJIS;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4687 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4688 else if (c >= 0xA0 && c < 0xE0)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4689 found = CATEGORY_MASK_SJIS;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4690 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4691 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4692 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4693 detect_info->rejected |= CATEGORY_MASK_SJIS;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4694 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4695
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4696 no_more_source:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4697 if (src_base < src && coding->mode & CODING_MODE_LAST_BLOCK)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4698 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4699 detect_info->rejected |= CATEGORY_MASK_SJIS;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4700 return 0;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4701 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4702 detect_info->found |= found;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4703 return 1;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4704 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4705
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4706 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4707 Check if a text is encoded in BIG5. If it is, return
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4708 CATEGORY_MASK_BIG5, else return 0. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4709
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
4710 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4711 detect_coding_big5 (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4712 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4713 struct coding_detection_info *detect_info;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4714 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4715 const unsigned char *src = coding->source, *src_base;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4716 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4717 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4718 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4719 int found = 0;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4720 int c;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4721
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4722 detect_info->checked |= CATEGORY_MASK_BIG5;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4723 /* A coding system of this category is always ASCII compatible. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4724 src += coding->head_ascii;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4725
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4726 while (1)
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4727 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4728 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4729 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4730 if (c < 0x80)
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4731 continue;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4732 if (c >= 0xA1)
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4733 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4734 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4735 if (c < 0x40 || (c >= 0x7F && c <= 0xA0))
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4736 return 0;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4737 found = CATEGORY_MASK_BIG5;
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4738 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4739 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4740 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4741 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4742 detect_info->rejected |= CATEGORY_MASK_BIG5;
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4743 return 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4744
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4745 no_more_source:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4746 if (src_base < src && coding->mode & CODING_MODE_LAST_BLOCK)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4747 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4748 detect_info->rejected |= CATEGORY_MASK_BIG5;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4749 return 0;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4750 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4751 detect_info->found |= found;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4752 return 1;
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4753 }
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
4754
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4755 /* See the above "GENERAL NOTES on `decode_coding_XXX ()' functions".
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4756 If SJIS_P is 1, decode SJIS text, else decode BIG5 test. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4757
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4758 static void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4759 decode_coding_sjis (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4760 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4761 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4762 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4763 const unsigned char *src_end = coding->source + coding->src_bytes;
59168
0345f2b10f1d (decode_coding_XXX, decode_composition_emacs_mule)
Dan Nicolaescu <dann@ics.uci.edu>
parents: 59095
diff changeset
4764 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4765 int *charbuf = coding->charbuf + coding->charbuf_used;
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
4766 /* We may produce one charset annocation in one loop and one more at
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
4767 the end. */
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4768 int *charbuf_end
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
4769 = coding->charbuf + coding->charbuf_size - (MAX_ANNOTATION_LENGTH * 2);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4770 int consumed_chars = 0, consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4771 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4772 struct charset *charset_roman, *charset_kanji, *charset_kana;
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4773 struct charset *charset_kanji2;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4774 Lisp_Object attrs, charset_list, val;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4775 int char_offset = coding->produced_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4776 int last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4777 int last_id = charset_ascii;
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
4778 int eol_crlf =
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
4779 !inhibit_eol_conversion && EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4780 int byte_after_cr = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4781
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4782 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4783
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4784 val = charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4785 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
4786 charset_kana = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4787 charset_kanji = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4788 charset_kanji2 = NILP (val) ? NULL : CHARSET_FROM_ID (XINT (XCAR (val)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4789
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4790 while (1)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4791 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4792 int c, c1;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4793 struct charset *charset;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4794
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4795 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4796 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4797
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4798 if (charbuf >= charbuf_end)
100936
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4799 {
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4800 if (byte_after_cr >= 0)
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4801 src_base--;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4802 break;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4803 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4804
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4805 if (byte_after_cr >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4806 c = byte_after_cr, byte_after_cr = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4807 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4808 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4809 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4810 goto invalid_code;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4811 if (c < 0x80)
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4812 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4813 if (eol_crlf && c == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4814 ONE_MORE_BYTE (byte_after_cr);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4815 charset = charset_roman;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4816 }
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4817 else if (c == 0x80 || c == 0xA0)
89730
d8fcefca5cf6 (decode_coding_sjis): Check the first byte rigidly.
Kenichi Handa <handa@m17n.org>
parents: 89686
diff changeset
4818 goto invalid_code;
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4819 else if (c >= 0xA1 && c <= 0xDF)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4820 {
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4821 /* SJIS -> JISX0201-Kana */
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4822 c &= 0x7F;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4823 charset = charset_kana;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4824 }
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4825 else if (c <= 0xEF)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4826 {
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4827 /* SJIS -> JISX0208 */
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4828 ONE_MORE_BYTE (c1);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4829 if (c1 < 0x40 || c1 == 0x7F || c1 > 0xFC)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4830 goto invalid_code;
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4831 c = (c << 8) | c1;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4832 SJIS_TO_JIS (c);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4833 charset = charset_kanji;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4834 }
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4835 else if (c <= 0xFC && charset_kanji2)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4836 {
89779
74c503490829 (decode_coding_sjis): Fix comment.
Kenichi Handa <handa@m17n.org>
parents: 89764
diff changeset
4837 /* SJIS -> JISX0213-2 */
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4838 ONE_MORE_BYTE (c1);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4839 if (c1 < 0x40 || c1 == 0x7F || c1 > 0xFC)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4840 goto invalid_code;
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4841 c = (c << 8) | c1;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4842 SJIS_TO_JIS2 (c);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4843 charset = charset_kanji2;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4844 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4845 else
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4846 goto invalid_code;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4847 if (charset->id != charset_ascii
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4848 && last_id != charset->id)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4849 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4850 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4851 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4852 last_id = charset->id;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4853 last_offset = char_offset;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4854 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4855 CODING_DECODE_CHAR (coding, src, src_base, src_end, charset, c, c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4856 *charbuf++ = c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4857 char_offset++;
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
4858 continue;
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
4859
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4860 invalid_code:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4861 src = src_base;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4862 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4863 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4864 *charbuf++ = c < 0 ? -c : BYTE8_TO_CHAR (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4865 char_offset++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4866 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4867 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4868
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4869 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4870 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4871 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4872 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4873 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4874 coding->charbuf_used = charbuf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4875 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4876
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4877 static void
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4878 decode_coding_big5 (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4879 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4880 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4881 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4882 const unsigned char *src_end = coding->source + coding->src_bytes;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
4883 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4884 int *charbuf = coding->charbuf + coding->charbuf_used;
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
4885 /* We may produce one charset annocation in one loop and one more at
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
4886 the end. */
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4887 int *charbuf_end
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
4888 = coding->charbuf + coding->charbuf_size - (MAX_ANNOTATION_LENGTH * 2);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4889 int consumed_chars = 0, consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4890 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4891 struct charset *charset_roman, *charset_big5;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4892 Lisp_Object attrs, charset_list, val;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4893 int char_offset = coding->produced_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4894 int last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4895 int last_id = charset_ascii;
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
4896 int eol_crlf =
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
4897 !inhibit_eol_conversion && EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4898 int byte_after_cr = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4899
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4900 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4901 val = charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4902 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4903 charset_big5 = CHARSET_FROM_ID (XINT (XCAR (val)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4904
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4905 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4906 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4907 int c, c1;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4908 struct charset *charset;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4909
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4910 src_base = src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4911 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4912
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4913 if (charbuf >= charbuf_end)
100936
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4914 {
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4915 if (byte_after_cr >= 0)
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4916 src_base--;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4917 break;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
4918 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4919
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4920 if (byte_after_cr >= 0)
92406
c36bda0a03cc (decode_coding_big5, produce_chars): Fix typos in last
Andreas Schwab <schwab@suse.de>
parents: 92399
diff changeset
4921 c = byte_after_cr, byte_after_cr = -1;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4922 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4923 ONE_MORE_BYTE (c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4924
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4925 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4926 goto invalid_code;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4927 if (c < 0x80)
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4928 {
92406
c36bda0a03cc (decode_coding_big5, produce_chars): Fix typos in last
Andreas Schwab <schwab@suse.de>
parents: 92399
diff changeset
4929 if (eol_crlf && c == '\r')
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4930 ONE_MORE_BYTE (byte_after_cr);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4931 charset = charset_roman;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
4932 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4933 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4934 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4935 /* BIG5 -> Big5 */
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4936 if (c < 0xA1 || c > 0xFE)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4937 goto invalid_code;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4938 ONE_MORE_BYTE (c1);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4939 if (c1 < 0x40 || (c1 > 0x7E && c1 < 0xA1) || c1 > 0xFE)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4940 goto invalid_code;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4941 c = c << 8 | c1;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4942 charset = charset_big5;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4943 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4944 if (charset->id != charset_ascii
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4945 && last_id != charset->id)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4946 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4947 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4948 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4949 last_id = charset->id;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4950 last_offset = char_offset;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4951 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4952 CODING_DECODE_CHAR (coding, src, src_base, src_end, charset, c, c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4953 *charbuf++ = c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4954 char_offset++;
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
4955 continue;
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
4956
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4957 invalid_code:
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4958 src = src_base;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4959 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4960 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
4961 *charbuf++ = c < 0 ? -c : BYTE8_TO_CHAR (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4962 char_offset++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4963 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4964 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4965
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4966 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
4967 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
4968 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4969 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4970 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4971 coding->charbuf_used = charbuf - coding->charbuf;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4972 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4973
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4974 /* See the above "GENERAL NOTES on `encode_coding_XXX ()' functions".
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4975 This function can encode charsets `ascii', `katakana-jisx0201',
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4976 `japanese-jisx0208', `chinese-big5-1', and `chinese-big5-2'. We
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
4977 are sure that all these charsets are registered as official charset
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4978 (i.e. do not have extended leading-codes). Characters of other
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4979 charsets are produced without any encoding. If SJIS_P is 1, encode
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4980 SJIS text, else encode BIG5 text. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4981
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4982 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4983 encode_coding_sjis (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4984 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
4985 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4986 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4987 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4988 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4989 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4990 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4991 int safe_room = 4;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4992 int produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4993 Lisp_Object attrs, charset_list, val;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4994 int ascii_compatible;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4995 struct charset *charset_roman, *charset_kanji, *charset_kana;
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
4996 struct charset *charset_kanji2;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4997 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
4998
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
4999 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5000 val = charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5001 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5002 charset_kana = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5003 charset_kanji = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5004 charset_kanji2 = NILP (val) ? NULL : CHARSET_FROM_ID (XINT (XCAR (val)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5005
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5006 ascii_compatible = ! NILP (CODING_ATTR_ASCII_COMPAT (attrs));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5007
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5008 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5009 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5010 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5011 c = *charbuf++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5012 /* Now encode the character C. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5013 if (ASCII_CHAR_P (c) && ascii_compatible)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5014 EMIT_ONE_ASCII_BYTE (c);
88690
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5015 else if (CHAR_BYTE8_P (c))
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5016 {
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5017 c = CHAR_TO_BYTE8 (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5018 EMIT_ONE_BYTE (c);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5019 }
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5020 else
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5021 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5022 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5023 struct charset *charset = char_charset (c, charset_list, &code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5024
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5025 if (!charset)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5026 {
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5027 if (coding->mode & CODING_MODE_SAFE_ENCODING)
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5028 {
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5029 code = CODING_INHIBIT_CHARACTER_SUBSTITUTION;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5030 charset = CHARSET_FROM_ID (charset_ascii);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5031 }
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5032 else
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5033 {
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5034 c = coding->default_char;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5035 charset = char_charset (c, charset_list, &code);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5036 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5037 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5038 if (code == CHARSET_INVALID_CODE (charset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5039 abort ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5040 if (charset == charset_kanji)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5041 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5042 int c1, c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5043 JIS_TO_SJIS (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5044 c1 = code >> 8, c2 = code & 0xFF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5045 EMIT_TWO_BYTES (c1, c2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5046 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5047 else if (charset == charset_kana)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5048 EMIT_ONE_BYTE (code | 0x80);
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5049 else if (charset_kanji2 && charset == charset_kanji2)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5050 {
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5051 int c1, c2;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5052
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5053 c1 = code >> 8;
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5054 if (c1 == 0x21 || (c1 >= 0x23 && c1 < 0x25)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5055 || (c1 >= 0x2C && c1 <= 0x2F) || c1 >= 0x6E)
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5056 {
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5057 JIS_TO_SJIS2 (code);
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5058 c1 = code >> 8, c2 = code & 0xFF;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5059 EMIT_TWO_BYTES (c1, c2);
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5060 }
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5061 else
89764
e3d26232ab78 (decode_coding_sjis): Handle 4th charset (typically JISX0212).
Kenichi Handa <handa@m17n.org>
parents: 89759
diff changeset
5062 EMIT_ONE_ASCII_BYTE (code & 0x7F);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5063 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5064 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5065 EMIT_ONE_ASCII_BYTE (code & 0x7F);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5066 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5067 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5068 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5069 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5070 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5071 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5072 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5073
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5074 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5075 encode_coding_big5 (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5076 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5077 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5078 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5079 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5080 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5081 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5082 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5083 int safe_room = 4;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5084 int produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5085 Lisp_Object attrs, charset_list, val;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5086 int ascii_compatible;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5087 struct charset *charset_roman, *charset_big5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5088 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5089
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5090 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5091 val = charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5092 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5093 charset_big5 = CHARSET_FROM_ID (XINT (XCAR (val)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5094 ascii_compatible = ! NILP (CODING_ATTR_ASCII_COMPAT (attrs));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5095
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5096 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5097 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5098 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5099 c = *charbuf++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5100 /* Now encode the character C. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5101 if (ASCII_CHAR_P (c) && ascii_compatible)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5102 EMIT_ONE_ASCII_BYTE (c);
88690
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5103 else if (CHAR_BYTE8_P (c))
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5104 {
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5105 c = CHAR_TO_BYTE8 (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5106 EMIT_ONE_BYTE (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5107 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5108 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5109 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5110 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5111 struct charset *charset = char_charset (c, charset_list, &code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5112
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5113 if (! charset)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5114 {
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5115 if (coding->mode & CODING_MODE_SAFE_ENCODING)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5116 {
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5117 code = CODING_INHIBIT_CHARACTER_SUBSTITUTION;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5118 charset = CHARSET_FROM_ID (charset_ascii);
51140
94d903190cee (ENCODE_UNSAFE_CHARACTER): Adjusted for the name change
Kenichi Handa <handa@m17n.org>
parents: 51090
diff changeset
5119 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5120 else
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5121 {
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5122 c = coding->default_char;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5123 charset = char_charset (c, charset_list, &code);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5124 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5125 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5126 if (code == CHARSET_INVALID_CODE (charset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5127 abort ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5128 if (charset == charset_big5)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5129 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5130 int c1, c2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5131
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5132 c1 = code >> 8, c2 = code & 0xFF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5133 EMIT_TWO_BYTES (c1, c2);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5134 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5135 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5136 EMIT_ONE_ASCII_BYTE (code & 0x7F);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5137 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5138 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5139 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5140 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5141 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5142 return 0;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5143 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5144
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5145
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5146 /*** 10. CCL handlers ***/
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5147
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5148 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5149 Check if a text is encoded in a coding system of which
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5150 encoder/decoder are written in CCL program. If it is, return
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5151 CATEGORY_MASK_CCL, else return 0. */
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5152
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
5153 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5154 detect_coding_ccl (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5155 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5156 struct coding_detection_info *detect_info;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5157 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5158 const unsigned char *src = coding->source, *src_base;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5159 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5160 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5161 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5162 int found = 0;
89848
3edfa038a435 (detect_coding_emacs_mule): Fix counting of encoded
Kenichi Handa <handa@m17n.org>
parents: 89842
diff changeset
5163 unsigned char *valids;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5164 int head_ascii = coding->head_ascii;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5165 Lisp_Object attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5166
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5167 detect_info->checked |= CATEGORY_MASK_CCL;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5168
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5169 coding = &coding_categories[coding_category_ccl];
89848
3edfa038a435 (detect_coding_emacs_mule): Fix counting of encoded
Kenichi Handa <handa@m17n.org>
parents: 89842
diff changeset
5170 valids = CODING_CCL_VALIDS (coding);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5171 attrs = CODING_ID_ATTRS (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5172 if (! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5173 src += head_ascii;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5174
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5175 while (1)
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5176 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5177 int c;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5178
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5179 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5180 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5181 if (c < 0 || ! valids[c])
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5182 break;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5183 if ((valids[c] > 1))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5184 found = CATEGORY_MASK_CCL;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5185 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5186 detect_info->rejected |= CATEGORY_MASK_CCL;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5187 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5188
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5189 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5190 detect_info->found |= found;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5191 return 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5192 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5193
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5194 static void
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5195 decode_coding_ccl (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5196 struct coding_system *coding;
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5197 {
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
5198 const unsigned char *src = coding->source + coding->consumed;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5199 const unsigned char *src_end = coding->source + coding->src_bytes;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5200 int *charbuf = coding->charbuf + coding->charbuf_used;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5201 int *charbuf_end = coding->charbuf + coding->charbuf_size;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5202 int consumed_chars = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5203 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5204 struct ccl_program ccl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5205 int source_charbuf[1024];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5206 int source_byteidx[1024];
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5207 Lisp_Object attrs, charset_list;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5208
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5209 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5210 setup_ccl_program (&ccl, CODING_CCL_DECODER (coding));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5211
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5212 while (src < src_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5213 {
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
5214 const unsigned char *p = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5215 int *source, *source_end;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5216 int i = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5217
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5218 if (multibytep)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5219 while (i < 1024 && p < src_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5220 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5221 source_byteidx[i] = p - src;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5222 source_charbuf[i++] = STRING_CHAR_ADVANCE (p);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5223 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5224 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5225 while (i < 1024 && p < src_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5226 source_charbuf[i++] = *p++;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5227
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5228 if (p == src_end && coding->mode & CODING_MODE_LAST_BLOCK)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5229 ccl.last_block = 1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5230
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5231 source = source_charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5232 source_end = source + i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5233 while (source < source_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5234 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5235 ccl_driver (&ccl, source, charbuf,
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
5236 source_end - source, charbuf_end - charbuf,
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
5237 charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5238 source += ccl.consumed;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5239 charbuf += ccl.produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5240 if (ccl.status != CCL_STAT_SUSPEND_BY_DST)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5241 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5242 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5243 if (source < source_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5244 src += source_byteidx[source - source_charbuf];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5245 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5246 src = p;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5247 consumed_chars += source - source_charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5248
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5249 if (ccl.status != CCL_STAT_SUSPEND_BY_SRC
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5250 && ccl.status != CODING_RESULT_INSUFFICIENT_SRC)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5251 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5252 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5253
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5254 switch (ccl.status)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5255 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5256 case CCL_STAT_SUSPEND_BY_SRC:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5257 record_conversion_result (coding, CODING_RESULT_INSUFFICIENT_SRC);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5258 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5259 case CCL_STAT_SUSPEND_BY_DST:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5260 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5261 case CCL_STAT_QUIT:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5262 case CCL_STAT_INVALID_CMD:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5263 record_conversion_result (coding, CODING_RESULT_INTERRUPT);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5264 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5265 default:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5266 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5267 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5268 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5269 coding->consumed_char += consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5270 coding->consumed = src - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5271 coding->charbuf_used = charbuf - coding->charbuf;
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5272 }
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5273
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5274 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5275 encode_coding_ccl (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5276 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5277 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5278 struct ccl_program ccl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5279 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5280 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5281 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5282 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5283 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5284 int destination_charbuf[1024];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5285 int i, produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5286 Lisp_Object attrs, charset_list;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5287
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5288 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5289 setup_ccl_program (&ccl, CODING_CCL_ENCODER (coding));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5290
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5291 ccl.last_block = coding->mode & CODING_MODE_LAST_BLOCK;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5292 ccl.dst_multibyte = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5293
90346
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5294 while (charbuf < charbuf_end)
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5295 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5296 ccl_driver (&ccl, charbuf, destination_charbuf,
90346
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5297 charbuf_end - charbuf, 1024, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5298 if (multibytep)
90346
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5299 {
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5300 ASSURE_DESTINATION (ccl.produced * 2);
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5301 for (i = 0; i < ccl.produced; i++)
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5302 EMIT_ONE_BYTE (destination_charbuf[i] & 0xFF);
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5303 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5304 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5305 {
90346
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5306 ASSURE_DESTINATION (ccl.produced);
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
5307 for (i = 0; i < ccl.produced; i++)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5308 *dst++ = destination_charbuf[i] & 0xFF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5309 produced_chars += ccl.produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5310 }
90346
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5311 charbuf += ccl.consumed;
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5312 if (ccl.status == CCL_STAT_QUIT
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5313 || ccl.status == CCL_STAT_INVALID_CMD)
bba59a8cdae0 (encode_coding_ccl): Allocate destination dynamically
Kenichi Handa <handa@m17n.org>
parents: 90336
diff changeset
5314 break;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5315 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5316
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5317 switch (ccl.status)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5318 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5319 case CCL_STAT_SUSPEND_BY_SRC:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5320 record_conversion_result (coding, CODING_RESULT_INSUFFICIENT_SRC);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5321 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5322 case CCL_STAT_SUSPEND_BY_DST:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5323 record_conversion_result (coding, CODING_RESULT_INSUFFICIENT_DST);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5324 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5325 case CCL_STAT_QUIT:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5326 case CCL_STAT_INVALID_CMD:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5327 record_conversion_result (coding, CODING_RESULT_INTERRUPT);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5328 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5329 default:
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5330 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5331 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5332 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5333
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5334 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5335 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5336 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5337 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5338
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5339
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5340
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5341 /*** 10, 11. no-conversion handlers ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5342
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5343 /* See the above "GENERAL NOTES on `decode_coding_XXX ()' functions". */
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5344
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5345 static void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5346 decode_coding_raw_text (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5347 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5348 {
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
5349 int eol_crlf =
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
5350 !inhibit_eol_conversion && EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5351
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5352 coding->chars_at_source = 1;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5353 coding->consumed_char = coding->src_chars;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5354 coding->consumed = coding->src_bytes;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5355 if (eol_crlf && coding->source[coding->src_bytes - 1] == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5356 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5357 coding->consumed_char--;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5358 coding->consumed--;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5359 record_conversion_result (coding, CODING_RESULT_INSUFFICIENT_SRC);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5360 }
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5361 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5362 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5363 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5364
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5365 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5366 encode_coding_raw_text (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5367 struct coding_system *coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5368 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5369 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5370 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5371 int *charbuf_end = coding->charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5372 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5373 unsigned char *dst_end = coding->destination + coding->dst_bytes;
95345
0350e5efb8f7 (encode_coding_raw_text): Fix last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 95344
diff changeset
5374 int produced_chars = 0;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5375 int c;
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5376
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5377 if (multibytep)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5378 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5379 int safe_room = MAX_MULTIBYTE_LENGTH * 2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5380
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5381 if (coding->src_multibyte)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5382 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5383 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5384 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5385 c = *charbuf++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5386 if (ASCII_CHAR_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5387 EMIT_ONE_ASCII_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5388 else if (CHAR_BYTE8_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5389 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5390 c = CHAR_TO_BYTE8 (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5391 EMIT_ONE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5392 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5393 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5394 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5395 unsigned char str[MAX_MULTIBYTE_LENGTH], *p0 = str, *p1 = str;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5396
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5397 CHAR_STRING_ADVANCE (c, p1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5398 while (p0 < p1)
88950
ad258ee59fbb * coding.c (make_conversion_work_buffer): Adjusted for the change
Kenichi Handa <handa@m17n.org>
parents: 88936
diff changeset
5399 {
ad258ee59fbb * coding.c (make_conversion_work_buffer): Adjusted for the change
Kenichi Handa <handa@m17n.org>
parents: 88936
diff changeset
5400 EMIT_ONE_BYTE (*p0);
ad258ee59fbb * coding.c (make_conversion_work_buffer): Adjusted for the change
Kenichi Handa <handa@m17n.org>
parents: 88936
diff changeset
5401 p0++;
ad258ee59fbb * coding.c (make_conversion_work_buffer): Adjusted for the change
Kenichi Handa <handa@m17n.org>
parents: 88936
diff changeset
5402 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5403 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5404 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5405 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5406 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5407 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5408 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5409 c = *charbuf++;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5410 EMIT_ONE_BYTE (c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5411 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5412 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5413 else
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5414 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5415 if (coding->src_multibyte)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5416 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5417 int safe_room = MAX_MULTIBYTE_LENGTH;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5418
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5419 while (charbuf < charbuf_end)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5420 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5421 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5422 c = *charbuf++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5423 if (ASCII_CHAR_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5424 *dst++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5425 else if (CHAR_BYTE8_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5426 *dst++ = CHAR_TO_BYTE8 (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5427 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5428 CHAR_STRING_ADVANCE (c, dst);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5429 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5430 }
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
5431 else
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5432 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5433 ASSURE_DESTINATION (charbuf_end - charbuf);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5434 while (charbuf < charbuf_end && dst < dst_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5435 *dst++ = *charbuf++;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5436 }
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
5437 produced_chars = dst - (coding->destination + coding->produced);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5438 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5439 record_conversion_result (coding, CODING_RESULT_SUCCESS);
95345
0350e5efb8f7 (encode_coding_raw_text): Fix last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 95344
diff changeset
5440 coding->produced_char += produced_chars;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5441 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5442 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5443 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5444
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5445 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5446 Check if a text is encoded in a charset-based coding system. If it
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5447 is, return 1, else return 0. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5448
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5449 static int
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5450 detect_coding_charset (coding, detect_info)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5451 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5452 struct coding_detection_info *detect_info;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5453 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5454 const unsigned char *src = coding->source, *src_base;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5455 const unsigned char *src_end = coding->source + coding->src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5456 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5457 int consumed_chars = 0;
98951
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5458 Lisp_Object attrs, valids, name;
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
5459 int found = 0;
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5460 int head_ascii = coding->head_ascii;
98951
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5461 int check_latin_extra = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5462
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5463 detect_info->checked |= CATEGORY_MASK_CHARSET;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5464
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5465 coding = &coding_categories[coding_category_charset];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5466 attrs = CODING_ID_ATTRS (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5467 valids = AREF (attrs, coding_attr_charset_valids);
98951
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5468 name = CODING_ID_NAME (coding->id);
102327
a1f0d8fadbb1 (detect_coding_charset): Fix last change for non-latin charsets.
Jason Rumney <jasonr@gnu.org>
parents: 102325
diff changeset
5469 if (strncmp ((char *) SDATA (SYMBOL_NAME (name)),
a1f0d8fadbb1 (detect_coding_charset): Fix last change for non-latin charsets.
Jason Rumney <jasonr@gnu.org>
parents: 102325
diff changeset
5470 "iso-8859-", sizeof ("iso-8859-") - 1) == 0
a1f0d8fadbb1 (detect_coding_charset): Fix last change for non-latin charsets.
Jason Rumney <jasonr@gnu.org>
parents: 102325
diff changeset
5471 || strncmp ((char *) SDATA (SYMBOL_NAME (name)),
a1f0d8fadbb1 (detect_coding_charset): Fix last change for non-latin charsets.
Jason Rumney <jasonr@gnu.org>
parents: 102325
diff changeset
5472 "iso-latin-", sizeof ("iso-latin-") - 1) == 0)
98951
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5473 check_latin_extra = 1;
102327
a1f0d8fadbb1 (detect_coding_charset): Fix last change for non-latin charsets.
Jason Rumney <jasonr@gnu.org>
parents: 102325
diff changeset
5474
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5475 if (! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5476 src += head_ascii;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5477
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5478 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5479 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5480 int c;
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5481 Lisp_Object val;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5482 struct charset *charset;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5483 int dim, idx;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5484
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5485 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5486 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5487 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5488 continue;
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5489 val = AREF (valids, c);
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5490 if (NILP (val))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5491 break;
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
5492 if (c >= 0x80)
98951
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5493 {
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5494 if (c < 0xA0
102327
a1f0d8fadbb1 (detect_coding_charset): Fix last change for non-latin charsets.
Jason Rumney <jasonr@gnu.org>
parents: 102325
diff changeset
5495 && check_latin_extra
a1f0d8fadbb1 (detect_coding_charset): Fix last change for non-latin charsets.
Jason Rumney <jasonr@gnu.org>
parents: 102325
diff changeset
5496 && (!VECTORP (Vlatin_extra_code_table)
102325
2c693a021d83 (detect_coding_charset): If not checking latin extra,
Jason Rumney <jasonr@gnu.org>
parents: 102320
diff changeset
5497 || NILP (XVECTOR (Vlatin_extra_code_table)->contents[c])))
98951
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5498 break;
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5499 found = CATEGORY_MASK_CHARSET;
71becd1e9707 (detect_coding_charset): For iso-8859-* coding systems,
Kenichi Handa <handa@m17n.org>
parents: 98186
diff changeset
5500 }
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5501 if (INTEGERP (val))
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5502 {
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5503 charset = CHARSET_FROM_ID (XFASTINT (val));
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5504 dim = CHARSET_DIMENSION (charset);
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5505 for (idx = 1; idx < dim; idx++)
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
5506 {
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5507 if (src == src_end)
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5508 goto too_short;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5509 ONE_MORE_BYTE (c);
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
5510 if (c < charset->code_space[(dim - 1 - idx) * 2]
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5511 || c > charset->code_space[(dim - 1 - idx) * 2 + 1])
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5512 break;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5513 }
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5514 if (idx < dim)
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5515 break;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5516 }
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5517 else
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5518 {
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5519 idx = 1;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5520 for (; CONSP (val); val = XCDR (val))
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5521 {
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5522 charset = CHARSET_FROM_ID (XFASTINT (XCAR (val)));
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5523 dim = CHARSET_DIMENSION (charset);
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5524 while (idx < dim)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5525 {
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5526 if (src == src_end)
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5527 goto too_short;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5528 ONE_MORE_BYTE (c);
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5529 if (c < charset->code_space[(dim - 1 - idx) * 4]
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5530 || c > charset->code_space[(dim - 1 - idx) * 4 + 1])
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5531 break;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5532 idx++;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5533 }
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5534 if (idx == dim)
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5535 {
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5536 val = Qnil;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5537 break;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5538 }
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
5539 }
90651
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5540 if (CONSP (val))
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5541 break;
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5542 }
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5543 }
23c1467f8640 (detect_coding_charset): Fix detection of multi-byte
Kenichi Handa <handa@m17n.org>
parents: 90599
diff changeset
5544 too_short:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5545 detect_info->rejected |= CATEGORY_MASK_CHARSET;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5546 return 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5547
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5548 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5549 detect_info->found |= found;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5550 return 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5551 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5552
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5553 static void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5554 decode_coding_charset (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5555 struct coding_system *coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5556 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5557 const unsigned char *src = coding->source + coding->consumed;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5558 const unsigned char *src_end = coding->source + coding->src_bytes;
46548
cb1914307488 (encode_eol, detect_coding, detect_eol):
Ken Raeburn <raeburn@raeburn.org>
parents: 46462
diff changeset
5559 const unsigned char *src_base;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5560 int *charbuf = coding->charbuf + coding->charbuf_used;
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
5561 /* We may produce one charset annocation in one loop and one more at
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
5562 the end. */
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5563 int *charbuf_end
103035
6e443d717c7b (decode_coding_utf_16): Reduce charbuf_end for the
Kenichi Handa <handa@m17n.org>
parents: 102738
diff changeset
5564 = coding->charbuf + coding->charbuf_size - (MAX_ANNOTATION_LENGTH * 2);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5565 int consumed_chars = 0, consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5566 int multibytep = coding->src_multibyte;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5567 Lisp_Object attrs, charset_list, valids;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5568 int char_offset = coding->produced_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5569 int last_offset = char_offset;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5570 int last_id = charset_ascii;
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
5571 int eol_crlf =
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
5572 !inhibit_eol_conversion && EQ (CODING_ID_EOL_TYPE (coding->id), Qdos);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5573 int byte_after_cr = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5574
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5575 CODING_GET_INFO (coding, attrs, charset_list);
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5576 valids = AREF (attrs, coding_attr_charset_valids);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5577
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5578 while (1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5579 {
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5580 int c;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5581 Lisp_Object val;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5582 struct charset *charset;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5583 int dim;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5584 int len = 1;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5585 unsigned code;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5586
29093
176708661b08 (encode_eol): Fix a bug of DOS style EOL encoding.
Kenichi Handa <handa@m17n.org>
parents: 29005
diff changeset
5587 src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5588 consumed_chars_base = consumed_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5589
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5590 if (charbuf >= charbuf_end)
100936
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
5591 {
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
5592 if (byte_after_cr >= 0)
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
5593 src_base--;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
5594 break;
5c5e6d041634 (decode_coding_utf_8): Check byte_after_cr before breaking the loop.
Kenichi Handa <handa@m17n.org>
parents: 100587
diff changeset
5595 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5596
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5597 if (byte_after_cr >= 0)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5598 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5599 c = byte_after_cr;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5600 byte_after_cr = -1;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5601 }
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5602 else
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5603 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5604 ONE_MORE_BYTE (c);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5605 if (eol_crlf && c == '\r')
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5606 ONE_MORE_BYTE (byte_after_cr);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
5607 }
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5608 if (c < 0)
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5609 goto invalid_code;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5610 code = c;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5611
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5612 val = AREF (valids, c);
100170
86455974b971 (decode_coding_charset): Check type of an element of
Kenichi Handa <handa@m17n.org>
parents: 100135
diff changeset
5613 if (! INTEGERP (val) && ! CONSP (val))
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5614 goto invalid_code;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5615 if (INTEGERP (val))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5616 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5617 charset = CHARSET_FROM_ID (XFASTINT (val));
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5618 dim = CHARSET_DIMENSION (charset);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5619 while (len < dim)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5620 {
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
5621 ONE_MORE_BYTE (c);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5622 code = (code << 8) | c;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5623 len++;
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
5624 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5625 CODING_DECODE_CHAR (coding, src, src_base, src_end,
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5626 charset, code, c);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5627 }
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
5628 else
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5629 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5630 /* VAL is a list of charset IDs. It is assured that the
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5631 list is sorted by charset dimensions (smaller one
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5632 comes first). */
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5633 while (CONSP (val))
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5634 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5635 charset = CHARSET_FROM_ID (XFASTINT (XCAR (val)));
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
5636 dim = CHARSET_DIMENSION (charset);
88607
18436bf3d6dd (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88598
diff changeset
5637 while (len < dim)
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5638 {
88598
b88195f69856 (decode_coding_charset): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88597
diff changeset
5639 ONE_MORE_BYTE (c);
b88195f69856 (decode_coding_charset): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88597
diff changeset
5640 code = (code << 8) | c;
88607
18436bf3d6dd (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88598
diff changeset
5641 len++;
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5642 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5643 CODING_DECODE_CHAR (coding, src, src_base,
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5644 src_end, charset, code, c);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5645 if (c >= 0)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5646 break;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5647 val = XCDR (val);
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5648 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5649 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5650 if (c < 0)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5651 goto invalid_code;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5652 if (charset->id != charset_ascii
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5653 && last_id != charset->id)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5654 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5655 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5656 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5657 last_id = charset->id;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5658 last_offset = char_offset;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5659 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5660
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5661 *charbuf++ = c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5662 char_offset++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5663 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5664
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5665 invalid_code:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5666 src = src_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5667 consumed_chars = consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5668 ONE_MORE_BYTE (c);
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5669 *charbuf++ = c < 0 ? -c : ASCII_BYTE_P (c) ? c : BYTE8_TO_CHAR (c);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5670 char_offset++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5671 coding->errors++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5672 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5673
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5674 no_more_source:
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5675 if (last_id != charset_ascii)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
5676 ADD_CHARSET_DATA (charbuf, char_offset - last_offset, last_id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5677 coding->consumed_char += consumed_chars_base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5678 coding->consumed = src_base - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5679 coding->charbuf_used = charbuf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5680 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5681
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5682 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5683 encode_coding_charset (coding)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5684 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5685 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5686 int multibytep = coding->dst_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5687 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5688 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5689 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5690 unsigned char *dst_end = coding->destination + coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5691 int safe_room = MAX_MULTIBYTE_LENGTH;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5692 int produced_chars = 0;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5693 Lisp_Object attrs, charset_list;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5694 int ascii_compatible;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5695 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5696
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
5697 CODING_GET_INFO (coding, attrs, charset_list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5698 ascii_compatible = ! NILP (CODING_ATTR_ASCII_COMPAT (attrs));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5699
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5700 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5701 {
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5702 struct charset *charset;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5703 unsigned code;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5704
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5705 ASSURE_DESTINATION (safe_room);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5706 c = *charbuf++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5707 if (ascii_compatible && ASCII_CHAR_P (c))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5708 EMIT_ONE_ASCII_BYTE (c);
88690
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5709 else if (CHAR_BYTE8_P (c))
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5710 {
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5711 c = CHAR_TO_BYTE8 (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5712 EMIT_ONE_BYTE (c);
7f284ac55b07 (encode_coding_emacs_mule): Pay attention to raw-8-bit chars.
Kenichi Handa <handa@m17n.org>
parents: 88681
diff changeset
5713 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5714 else
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5715 {
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5716 charset = char_charset (c, charset_list, &code);
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5717 if (charset)
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5718 {
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5719 if (CHARSET_DIMENSION (charset) == 1)
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5720 EMIT_ONE_BYTE (code);
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5721 else if (CHARSET_DIMENSION (charset) == 2)
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5722 EMIT_TWO_BYTES (code >> 8, code & 0xFF);
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5723 else if (CHARSET_DIMENSION (charset) == 3)
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5724 EMIT_THREE_BYTES (code >> 16, (code >> 8) & 0xFF, code & 0xFF);
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5725 else
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5726 EMIT_FOUR_BYTES (code >> 24, (code >> 16) & 0xFF,
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5727 (code >> 8) & 0xFF, code & 0xFF);
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5728 }
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5729 else
88573
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5730 {
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5731 if (coding->mode & CODING_MODE_SAFE_ENCODING)
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5732 c = CODING_INHIBIT_CHARACTER_SUBSTITUTION;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5733 else
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5734 c = coding->default_char;
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5735 EMIT_ONE_BYTE (c);
133bf7ab1bad (encode_coding_iso_2022): If coding requires safe
Kenichi Handa <handa@m17n.org>
parents: 88544
diff changeset
5736 }
88465
ae455bb40718 (decode_coding_charset, encode_coding_charset): Handle
Kenichi Handa <handa@m17n.org>
parents: 88456
diff changeset
5737 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5738 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5739
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
5740 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5741 coding->produced_char += produced_chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5742 coding->produced = dst - coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5743 return 0;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5744 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5745
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5746
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
5747 /*** 7. C library functions ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5748
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5749 /* Setup coding context CODING from information about CODING_SYSTEM.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5750 If CODING_SYSTEM is nil, `no-conversion' is assumed. If
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5751 CODING_SYSTEM is invalid, signal an error. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5752
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5753 void
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
5754 setup_coding_system (coding_system, coding)
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
5755 Lisp_Object coding_system;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5756 struct coding_system *coding;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5757 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5758 Lisp_Object attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5759 Lisp_Object eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5760 Lisp_Object coding_type;
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
5761 Lisp_Object val;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5762
24460
be35d27a4bfb (setup_coding_system): Check for CODING_SYSTEM = nil.
Kenichi Handa <handa@m17n.org>
parents: 24425
diff changeset
5763 if (NILP (coding_system))
90011
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
5764 coding_system = Qundecided;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5765
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5766 CHECK_CODING_SYSTEM_GET_ID (coding_system, coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5767
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5768 attrs = CODING_ID_ATTRS (coding->id);
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
5769 eol_type = inhibit_eol_conversion ? Qunix : CODING_ID_EOL_TYPE (coding->id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5770
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5771 coding->mode = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5772 coding->head_ascii = -1;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
5773 if (VECTORP (eol_type))
90587
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5774 coding->common_flags = (CODING_REQUIRE_DECODING_MASK
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5775 | CODING_REQUIRE_DETECTION_MASK);
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5776 else if (! EQ (eol_type, Qunix))
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5777 coding->common_flags = (CODING_REQUIRE_DECODING_MASK
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5778 | CODING_REQUIRE_ENCODING_MASK);
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5779 else
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
5780 coding->common_flags = 0;
89448
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
5781 if (! NILP (CODING_ATTR_POST_READ (attrs)))
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
5782 coding->common_flags |= CODING_REQUIRE_DECODING_MASK;
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
5783 if (! NILP (CODING_ATTR_PRE_WRITE (attrs)))
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
5784 coding->common_flags |= CODING_REQUIRE_ENCODING_MASK;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5785 if (! NILP (CODING_ATTR_FOR_UNIBYTE (attrs)))
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5786 coding->common_flags |= CODING_FOR_UNIBYTE_MASK;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5787
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5788 val = CODING_ATTR_SAFE_CHARSETS (attrs);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5789 coding->max_charset_id = SCHARS (val) - 1;
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
5790 coding->safe_charsets = SDATA (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5791 coding->default_char = XINT (CODING_ATTR_DEFAULT_CHAR (attrs));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5792
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5793 coding_type = CODING_ATTR_TYPE (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5794 if (EQ (coding_type, Qundecided))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5795 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5796 coding->detector = NULL;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5797 coding->decoder = decode_coding_raw_text;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5798 coding->encoder = encode_coding_raw_text;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5799 coding->common_flags |= CODING_REQUIRE_DETECTION_MASK;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5800 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5801 else if (EQ (coding_type, Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5802 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5803 int i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5804 int flags = XINT (AREF (attrs, coding_attr_iso_flags));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5805
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5806 /* Invoke graphic register 0 to plane 0. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5807 CODING_ISO_INVOCATION (coding, 0) = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5808 /* Invoke graphic register 1 to plane 1 if we can use 8-bit. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5809 CODING_ISO_INVOCATION (coding, 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5810 = (flags & CODING_ISO_FLAG_SEVEN_BITS ? -1 : 1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5811 /* Setup the initial status of designation. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5812 for (i = 0; i < 4; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5813 CODING_ISO_DESIGNATION (coding, i) = CODING_ISO_INITIAL (coding, i);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5814 /* Not single shifting initially. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5815 CODING_ISO_SINGLE_SHIFTING (coding) = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5816 /* Beginning of buffer should also be regarded as bol. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5817 CODING_ISO_BOL (coding) = 1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5818 coding->detector = detect_coding_iso_2022;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5819 coding->decoder = decode_coding_iso_2022;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5820 coding->encoder = encode_coding_iso_2022;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5821 if (flags & CODING_ISO_FLAG_SAFE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5822 coding->mode |= CODING_MODE_SAFE_ENCODING;
20227
71008f909642 (setup_coding_system): Initialize common_flags member
Kenichi Handa <handa@m17n.org>
parents: 20150
diff changeset
5823 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5824 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5825 | CODING_REQUIRE_FLUSHING_MASK);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5826 if (flags & CODING_ISO_FLAG_COMPOSITION)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5827 coding->common_flags |= CODING_ANNOTATE_COMPOSITION_MASK;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5828 if (flags & CODING_ISO_FLAG_DESIGNATION)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
5829 coding->common_flags |= CODING_ANNOTATE_CHARSET_MASK;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5830 if (flags & CODING_ISO_FLAG_FULL_SUPPORT)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5831 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5832 setup_iso_safe_charsets (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5833 val = CODING_ATTR_SAFE_CHARSETS (attrs);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5834 coding->max_charset_id = SCHARS (val) - 1;
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
5835 coding->safe_charsets = SDATA (val);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
5836 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5837 CODING_ISO_FLAGS (coding) = flags;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5838 CODING_ISO_CMP_STATUS (coding)->state = COMPOSING_NO;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5839 CODING_ISO_CMP_STATUS (coding)->method = COMPOSITION_NO;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5840 CODING_ISO_EXTSEGMENT_LEN (coding) = 0;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5841 CODING_ISO_EMBEDDED_UTF_8 (coding) = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5842 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5843 else if (EQ (coding_type, Qcharset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5844 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5845 coding->detector = detect_coding_charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5846 coding->decoder = decode_coding_charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5847 coding->encoder = encode_coding_charset;
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
5848 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5849 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5850 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5851 else if (EQ (coding_type, Qutf_8))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5852 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5853 val = AREF (attrs, coding_attr_utf_bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5854 CODING_UTF_8_BOM (coding) = (CONSP (val) ? utf_detect_bom
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5855 : EQ (val, Qt) ? utf_with_bom
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5856 : utf_without_bom);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5857 coding->detector = detect_coding_utf_8;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5858 coding->decoder = decode_coding_utf_8;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5859 coding->encoder = encode_coding_utf_8;
34888
b469d29c0815 (SAFE_ONE_MORE_BYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34813
diff changeset
5860 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5861 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5862 if (CODING_UTF_8_BOM (coding) == utf_detect_bom)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5863 coding->common_flags |= CODING_REQUIRE_DETECTION_MASK;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5864 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5865 else if (EQ (coding_type, Qutf_16))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5866 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5867 val = AREF (attrs, coding_attr_utf_bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5868 CODING_UTF_16_BOM (coding) = (CONSP (val) ? utf_detect_bom
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5869 : EQ (val, Qt) ? utf_with_bom
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5870 : utf_without_bom);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5871 val = AREF (attrs, coding_attr_utf_16_endian);
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
5872 CODING_UTF_16_ENDIAN (coding) = (EQ (val, Qbig) ? utf_16_big_endian
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5873 : utf_16_little_endian);
88438
3a34b722dd71 (encode_coding_utf_8): Initialize produced_chars to 0.
Kenichi Handa <handa@m17n.org>
parents: 88430
diff changeset
5874 CODING_UTF_16_SURROGATE (coding) = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5875 coding->detector = detect_coding_utf_16;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5876 coding->decoder = decode_coding_utf_16;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5877 coding->encoder = encode_coding_utf_16;
20227
71008f909642 (setup_coding_system): Initialize common_flags member
Kenichi Handa <handa@m17n.org>
parents: 20150
diff changeset
5878 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5879 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
5880 if (CODING_UTF_16_BOM (coding) == utf_detect_bom)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
5881 coding->common_flags |= CODING_REQUIRE_DETECTION_MASK;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5882 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5883 else if (EQ (coding_type, Qccl))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5884 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5885 coding->detector = detect_coding_ccl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5886 coding->decoder = decode_coding_ccl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5887 coding->encoder = encode_coding_ccl;
20227
71008f909642 (setup_coding_system): Initialize common_flags member
Kenichi Handa <handa@m17n.org>
parents: 20150
diff changeset
5888 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5889 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5890 | CODING_REQUIRE_FLUSHING_MASK);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5891 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5892 else if (EQ (coding_type, Qemacs_mule))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5893 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5894 coding->detector = detect_coding_emacs_mule;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5895 coding->decoder = decode_coding_emacs_mule;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5896 coding->encoder = encode_coding_emacs_mule;
20227
71008f909642 (setup_coding_system): Initialize common_flags member
Kenichi Handa <handa@m17n.org>
parents: 20150
diff changeset
5897 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5898 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5899 coding->spec.emacs_mule.full_support = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5900 if (! NILP (AREF (attrs, coding_attr_emacs_mule_full))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5901 && ! EQ (CODING_ATTR_CHARSET_LIST (attrs), Vemacs_mule_charset_list))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5902 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5903 Lisp_Object tail, safe_charsets;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5904 int max_charset_id = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5905
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5906 for (tail = Vemacs_mule_charset_list; CONSP (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5907 tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5908 if (max_charset_id < XFASTINT (XCAR (tail)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5909 max_charset_id = XFASTINT (XCAR (tail));
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
5910 safe_charsets = make_uninit_string (max_charset_id + 1);
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
5911 memset (SDATA (safe_charsets), 255, max_charset_id + 1);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5912 for (tail = Vemacs_mule_charset_list; CONSP (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5913 tail = XCDR (tail))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
5914 SSET (safe_charsets, XFASTINT (XCAR (tail)), 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5915 coding->max_charset_id = max_charset_id;
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
5916 coding->safe_charsets = SDATA (safe_charsets);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5917 coding->spec.emacs_mule.full_support = 1;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5918 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5919 coding->spec.emacs_mule.cmp_status.state = COMPOSING_NO;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
5920 coding->spec.emacs_mule.cmp_status.method = COMPOSITION_NO;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5921 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5922 else if (EQ (coding_type, Qshift_jis))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5923 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5924 coding->detector = detect_coding_sjis;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5925 coding->decoder = decode_coding_sjis;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5926 coding->encoder = encode_coding_sjis;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5927 coding->common_flags
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5928 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5929 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5930 else if (EQ (coding_type, Qbig5))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5931 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5932 coding->detector = detect_coding_big5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5933 coding->decoder = decode_coding_big5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5934 coding->encoder = encode_coding_big5;
20227
71008f909642 (setup_coding_system): Initialize common_flags member
Kenichi Handa <handa@m17n.org>
parents: 20150
diff changeset
5935 coding->common_flags
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5936 |= (CODING_REQUIRE_DECODING_MASK | CODING_REQUIRE_ENCODING_MASK);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5937 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5938 else /* EQ (coding_type, Qraw_text) */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5939 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5940 coding->detector = NULL;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5941 coding->decoder = decode_coding_raw_text;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5942 coding->encoder = encode_coding_raw_text;
89933
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5943 if (! EQ (eol_type, Qunix))
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5944 {
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5945 coding->common_flags |= CODING_REQUIRE_DECODING_MASK;
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5946 if (! VECTORP (eol_type))
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5947 coding->common_flags |= CODING_REQUIRE_ENCODING_MASK;
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5948 }
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
5949
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5950 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
5951
22616
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
5952 return;
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
5953 }
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
5954
90061
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5955 /* Return a list of charsets supported by CODING. */
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5956
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5957 Lisp_Object
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5958 coding_charset_list (coding)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
5959 struct coding_system *coding;
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
5960 {
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
5961 Lisp_Object attrs, charset_list;
90061
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5962
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5963 CODING_GET_INFO (coding, attrs, charset_list);
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5964 if (EQ (CODING_ATTR_TYPE (attrs), Qiso_2022))
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5965 {
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5966 int flags = XINT (AREF (attrs, coding_attr_iso_flags));
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5967
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5968 if (flags & CODING_ISO_FLAG_FULL_SUPPORT)
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5969 charset_list = Viso_2022_charset_list;
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5970 }
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5971 else if (EQ (CODING_ATTR_TYPE (attrs), Qemacs_mule))
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5972 {
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5973 charset_list = Vemacs_mule_charset_list;
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5974 }
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5975 return charset_list;
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5976 }
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5977
48210be97b12 Cancel the change done in HEAD on 2004-11-30.
Kenichi Handa <handa@m17n.org>
parents: 90054
diff changeset
5978
101776
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5979 /* Return a list of charsets supported by CODING-SYSTEM. */
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5980
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5981 Lisp_Object
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5982 coding_system_charset_list (coding_system)
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5983 Lisp_Object coding_system;
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5984 {
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5985 int id;
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5986 Lisp_Object attrs, charset_list;
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5987
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5988 CHECK_CODING_SYSTEM_GET_ID (coding_system, id);
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5989 attrs = CODING_ID_ATTRS (id);
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5990
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5991 if (EQ (CODING_ATTR_TYPE (attrs), Qiso_2022))
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5992 {
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5993 int flags = XINT (AREF (attrs, coding_attr_iso_flags));
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5994
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5995 if (flags & CODING_ISO_FLAG_FULL_SUPPORT)
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5996 charset_list = Viso_2022_charset_list;
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5997 else
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5998 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
5999 }
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
6000 else if (EQ (CODING_ATTR_TYPE (attrs), Qemacs_mule))
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
6001 {
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
6002 charset_list = Vemacs_mule_charset_list;
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
6003 }
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
6004 else
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
6005 {
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
6006 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
6007 }
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
6008 return charset_list;
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
6009 }
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
6010
11ba351ce12b (coding_system_charset_list): New function.
Kenichi Handa <handa@m17n.org>
parents: 101678
diff changeset
6011
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6012 /* Return raw-text or one of its subsidiaries that has the same
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6013 eol_type as CODING-SYSTEM. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6014
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6015 Lisp_Object
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6016 raw_text_coding_system (coding_system)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6017 Lisp_Object coding_system;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6018 {
88430
6418a272b97e * coding.c: Delete unused variables.
Kenichi Handa <handa@m17n.org>
parents: 88365
diff changeset
6019 Lisp_Object spec, attrs;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6020 Lisp_Object eol_type, raw_text_eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6021
89462
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
6022 if (NILP (coding_system))
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
6023 return Qraw_text;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6024 spec = CODING_SYSTEM_SPEC (coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6025 attrs = AREF (spec, 0);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
6026
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6027 if (EQ (CODING_ATTR_TYPE (attrs), Qraw_text))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6028 return coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6029
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6030 eol_type = AREF (spec, 2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6031 if (VECTORP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6032 return Qraw_text;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6033 spec = CODING_SYSTEM_SPEC (Qraw_text);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6034 raw_text_eol_type = AREF (spec, 2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6035 return (EQ (eol_type, Qunix) ? AREF (raw_text_eol_type, 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6036 : EQ (eol_type, Qdos) ? AREF (raw_text_eol_type, 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6037 : AREF (raw_text_eol_type, 2));
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6038 }
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
6039
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6040
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6041 /* If CODING_SYSTEM doesn't specify end-of-line format but PARENT
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6042 does, return one of the subsidiary that has the same eol-spec as
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6043 PARENT. Otherwise, return CODING_SYSTEM. If PARENT is nil,
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6044 inherit end-of-line format from the system's setting
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6045 (system_eol_type). */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6046
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6047 Lisp_Object
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6048 coding_inherit_eol_type (coding_system, parent)
88473
b47ee8b1ce03 (coding_inherit_eol_type)
Dave Love <fx@gnu.org>
parents: 88465
diff changeset
6049 Lisp_Object coding_system, parent;
22616
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
6050 {
89545
4f394eed6ff2 (inhibit_pre_post_conversion): Removed (unused).
Dave Love <fx@gnu.org>
parents: 89519
diff changeset
6051 Lisp_Object spec, eol_type;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6052
89462
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
6053 if (NILP (coding_system))
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
6054 coding_system = Qraw_text;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6055 spec = CODING_SYSTEM_SPEC (coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6056 eol_type = AREF (spec, 2);
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6057 if (VECTORP (eol_type))
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6058 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6059 Lisp_Object parent_eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6060
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6061 if (! NILP (parent))
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6062 {
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6063 Lisp_Object parent_spec;
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6064
90587
fe721cfad011 (setup_coding_system): Fix setting of
Kenichi Handa <handa@m17n.org>
parents: 90573
diff changeset
6065 parent_spec = CODING_SYSTEM_SPEC (parent);
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6066 parent_eol_type = AREF (parent_spec, 2);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6067 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6068 else
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
6069 parent_eol_type = system_eol_type;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6070 if (EQ (parent_eol_type, Qunix))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6071 coding_system = AREF (eol_type, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6072 else if (EQ (parent_eol_type, Qdos))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6073 coding_system = AREF (eol_type, 1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6074 else if (EQ (parent_eol_type, Qmac))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6075 coding_system = AREF (eol_type, 2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6076 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6077 return coding_system;
22616
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
6078 }
c493ce6a31e4 (setup_raw_text_coding_system): New function.
Kenichi Handa <handa@m17n.org>
parents: 22529
diff changeset
6079
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6080 /* Emacs has a mechanism to automatically detect a coding system if it
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6081 is one of Emacs' internal format, ISO2022, SJIS, and BIG5. But,
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6082 it's impossible to distinguish some coding systems accurately
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6083 because they use the same range of codes. So, at first, coding
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6084 systems are categorized into 7, those are:
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6085
17835
f36ffb6f1208 Name change through the code:
Kenichi Handa <handa@m17n.org>
parents: 17725
diff changeset
6086 o coding-category-emacs-mule
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6087
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6088 The category for a coding system which has the same code range
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6089 as Emacs' internal format. Assigned the coding-system (Lisp
17835
f36ffb6f1208 Name change through the code:
Kenichi Handa <handa@m17n.org>
parents: 17725
diff changeset
6090 symbol) `emacs-mule' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6091
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6092 o coding-category-sjis
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6093
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6094 The category for a coding system which has the same code range
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6095 as SJIS. Assigned the coding-system (Lisp
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6096 symbol) `japanese-shift-jis' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6097
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6098 o coding-category-iso-7
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6099
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6100 The category for a coding system which has the same code range
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6101 as ISO2022 of 7-bit environment. This doesn't use any locking
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6102 shift and single shift functions. This can encode/decode all
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6103 charsets. Assigned the coding-system (Lisp symbol)
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6104 `iso-2022-7bit' by default.
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6105
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6106 o coding-category-iso-7-tight
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6107
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6108 Same as coding-category-iso-7 except that this can
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6109 encode/decode only the specified charsets.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6110
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6111 o coding-category-iso-8-1
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6112
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6113 The category for a coding system which has the same code range
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6114 as ISO2022 of 8-bit environment and graphic plane 1 used only
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6115 for DIMENSION1 charset. This doesn't use any locking shift
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6116 and single shift functions. Assigned the coding-system (Lisp
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6117 symbol) `iso-latin-1' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6118
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6119 o coding-category-iso-8-2
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6120
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6121 The category for a coding system which has the same code range
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6122 as ISO2022 of 8-bit environment and graphic plane 1 used only
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6123 for DIMENSION2 charset. This doesn't use any locking shift
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6124 and single shift functions. Assigned the coding-system (Lisp
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6125 symbol) `japanese-iso-8bit' by default.
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6126
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6127 o coding-category-iso-7-else
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6128
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6129 The category for a coding system which has the same code range
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6130 as ISO2022 of 7-bit environemnt but uses locking shift or
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6131 single shift functions. Assigned the coding-system (Lisp
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6132 symbol) `iso-2022-7bit-lock' by default.
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6133
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6134 o coding-category-iso-8-else
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6135
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6136 The category for a coding system which has the same code range
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6137 as ISO2022 of 8-bit environemnt but uses locking shift or
18787
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6138 single shift functions. Assigned the coding-system (Lisp
954e6be0a757 (detect_coding_iso2022): Distinguish coding-category-iso-7-else and
Kenichi Handa <handa@m17n.org>
parents: 18766
diff changeset
6139 symbol) `iso-2022-8bit-ss2' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6140
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6141 o coding-category-big5
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6142
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6143 The category for a coding system which has the same code range
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6144 as BIG5. Assigned the coding-system (Lisp symbol)
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
6145 `cn-big5' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6146
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6147 o coding-category-utf-8
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6148
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6149 The category for a coding system which has the same code range
54303
5256a4b9366f UTF-8 is now RFC3629.
Eli Zaretskii <eliz@gnu.org>
parents: 53775
diff changeset
6150 as UTF-8 (cf. RFC3629). Assigned the coding-system (Lisp
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6151 symbol) `utf-8' by default.
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6152
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6153 o coding-category-utf-16-be
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6154
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6155 The category for a coding system in which a text has an
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6156 Unicode signature (cf. Unicode Standard) in the order of BIG
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6157 endian at the head. Assigned the coding-system (Lisp symbol)
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6158 `utf-16-be' by default.
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6159
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6160 o coding-category-utf-16-le
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6161
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6162 The category for a coding system in which a text has an
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6163 Unicode signature (cf. Unicode Standard) in the order of
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6164 LITTLE endian at the head. Assigned the coding-system (Lisp
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6165 symbol) `utf-16-le' by default.
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6166
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
6167 o coding-category-ccl
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
6168
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
6169 The category for a coding system of which encoder/decoder is
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
6170 written in CCL programs. The default value is nil, i.e., no
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
6171 coding system is assigned.
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
6172
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6173 o coding-category-binary
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6174
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6175 The category for a coding system not categorized in any of the
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6176 above. Assigned the coding-system (Lisp symbol)
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
6177 `no-conversion' by default.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6178
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6179 Each of them is a Lisp symbol and the value is an actual
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6180 `coding-system's (this is also a Lisp symbol) assigned by a user.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6181 What Emacs does actually is to detect a category of coding system.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6182 Then, it uses a `coding-system' assigned to it. If Emacs can't
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6183 decide only one possible category, it selects a category of the
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6184 highest priority. Priorities of categories are also specified by a
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6185 user in a Lisp variable `coding-category-list'.
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6186
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6187 */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6188
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6189 #define EOL_SEEN_NONE 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6190 #define EOL_SEEN_LF 1
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6191 #define EOL_SEEN_CR 2
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6192 #define EOL_SEEN_CRLF 4
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6193
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6194 /* Detect how end-of-line of a text of length SRC_BYTES pointed by
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6195 SOURCE is encoded. If CATEGORY is one of
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6196 coding_category_utf_16_XXXX, assume that CR and LF are encoded by
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6197 two-byte, else they are encoded by one-byte.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6198
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6199 Return one of EOL_SEEN_XXX. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6200
19173
04ed7c3f5cee (detect_eol_type): If EOL representation does not
Richard M. Stallman <rms@gnu.org>
parents: 19134
diff changeset
6201 #define MAX_EOL_CHECK_COUNT 3
04ed7c3f5cee (detect_eol_type): If EOL representation does not
Richard M. Stallman <rms@gnu.org>
parents: 19134
diff changeset
6202
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6203 static int
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
6204 detect_eol (source, src_bytes, category)
84646
922a7e3b7383 (detect_eol_type, detect_eol_type_in_2_octet_form):
Michaël Cadilhac <michael.cadilhac@lrde.org>
parents: 83648
diff changeset
6205 const unsigned char *source;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6206 EMACS_INT src_bytes;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
6207 enum coding_category category;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6208 {
84646
922a7e3b7383 (detect_eol_type, detect_eol_type_in_2_octet_form):
Michaël Cadilhac <michael.cadilhac@lrde.org>
parents: 83648
diff changeset
6209 const unsigned char *src = source, *src_end = src + src_bytes;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6210 unsigned char c;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6211 int total = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6212 int eol_seen = EOL_SEEN_NONE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6213
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
6214 if ((1 << category) & CATEGORY_MASK_UTF_16)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6215 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6216 int msb, lsb;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6217
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
6218 msb = category == (coding_category_utf_16_le
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
6219 | coding_category_utf_16_le_nosig);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6220 lsb = 1 - msb;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6221
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6222 while (src + 1 < src_end)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6223 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6224 c = src[lsb];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6225 if (src[msb] == 0 && (c == '\n' || c == '\r'))
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6226 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6227 int this_eol;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6228
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6229 if (c == '\n')
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6230 this_eol = EOL_SEEN_LF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6231 else if (src + 3 >= src_end
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6232 || src[msb + 2] != 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6233 || src[lsb + 2] != '\n')
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6234 this_eol = EOL_SEEN_CR;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6235 else
101678
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6236 {
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6237 this_eol = EOL_SEEN_CRLF;
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6238 src += 2;
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6239 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6240
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6241 if (eol_seen == EOL_SEEN_NONE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6242 /* This is the first end-of-line. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6243 eol_seen = this_eol;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6244 else if (eol_seen != this_eol)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6245 {
101678
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6246 /* The found type is different from what found before.
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6247 Allow for stray ^M characters in DOS EOL files. */
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6248 if (eol_seen == EOL_SEEN_CR && this_eol == EOL_SEEN_CRLF
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6249 || eol_seen == EOL_SEEN_CRLF && this_eol == EOL_SEEN_CR)
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6250 eol_seen = EOL_SEEN_CRLF;
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6251 else
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6252 {
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6253 eol_seen = EOL_SEEN_LF;
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6254 break;
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6255 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6256 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6257 if (++total == MAX_EOL_CHECK_COUNT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6258 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6259 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6260 src += 2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6261 }
30833
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
6262 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6263 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6264 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6265 while (src < src_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6266 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6267 c = *src++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6268 if (c == '\n' || c == '\r')
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6269 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6270 int this_eol;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6271
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6272 if (c == '\n')
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6273 this_eol = EOL_SEEN_LF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6274 else if (src >= src_end || *src != '\n')
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6275 this_eol = EOL_SEEN_CR;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6276 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6277 this_eol = EOL_SEEN_CRLF, src++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6278
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6279 if (eol_seen == EOL_SEEN_NONE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6280 /* This is the first end-of-line. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6281 eol_seen = this_eol;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6282 else if (eol_seen != this_eol)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6283 {
101678
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6284 /* The found type is different from what found before.
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6285 Allow for stray ^M characters in DOS EOL files. */
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6286 if (eol_seen == EOL_SEEN_CR && this_eol == EOL_SEEN_CRLF
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6287 || eol_seen == EOL_SEEN_CRLF && this_eol == EOL_SEEN_CR)
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6288 eol_seen = EOL_SEEN_CRLF;
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6289 else
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6290 {
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6291 eol_seen = EOL_SEEN_LF;
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6292 break;
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6293 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6294 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6295 if (++total == MAX_EOL_CHECK_COUNT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6296 break;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6297 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6298 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6299 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6300 return eol_seen;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6301 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6302
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6303
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6304 static Lisp_Object
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6305 adjust_coding_eol_type (coding, eol_seen)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6306 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6307 int eol_seen;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6308 {
88430
6418a272b97e * coding.c: Delete unused variables.
Kenichi Handa <handa@m17n.org>
parents: 88365
diff changeset
6309 Lisp_Object eol_type;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
6310
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6311 eol_type = CODING_ID_EOL_TYPE (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6312 if (eol_seen & EOL_SEEN_LF)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6313 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6314 coding->id = CODING_SYSTEM_ID (AREF (eol_type, 0));
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6315 eol_type = Qunix;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6316 }
88862
108e2535280d (adjust_coding_eol_type): Fix eol_type/eol_seen mixup.
Dave Love <fx@gnu.org>
parents: 88856
diff changeset
6317 else if (eol_seen & EOL_SEEN_CRLF)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6318 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6319 coding->id = CODING_SYSTEM_ID (AREF (eol_type, 1));
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6320 eol_type = Qdos;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6321 }
88862
108e2535280d (adjust_coding_eol_type): Fix eol_type/eol_seen mixup.
Dave Love <fx@gnu.org>
parents: 88856
diff changeset
6322 else if (eol_seen & EOL_SEEN_CR)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6323 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6324 coding->id = CODING_SYSTEM_ID (AREF (eol_type, 2));
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6325 eol_type = Qmac;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6326 }
19181
917138730635 (detect_eol_type): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 19173
diff changeset
6327 return eol_type;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6328 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6329
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6330 /* Detect how a text specified in CODING is encoded. If a coding
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6331 system is detected, update fields of CODING by the detected coding
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6332 system. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6333
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6334 void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6335 detect_coding (coding)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6336 struct coding_system *coding;
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6337 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
6338 const unsigned char *src, *src_end;
102105
a5023e8bbb1e (detect_coding): Preserve coding->mode.
Kenichi Handa <handa@m17n.org>
parents: 102058
diff changeset
6339 int saved_mode = coding->mode;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6340
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6341 coding->consumed = coding->consumed_char = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6342 coding->produced = coding->produced_char = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6343 coding_set_source (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6344
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6345 src_end = coding->source + coding->src_bytes;
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6346 coding->head_ascii = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6347
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6348 /* If we have not yet decided the text encoding type, detect it
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6349 now. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6350 if (EQ (CODING_ATTR_TYPE (CODING_ID_ATTRS (coding->id)), Qundecided))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6351 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6352 int c, i;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6353 struct coding_detection_info detect_info;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6354 int null_byte_found = 0, eight_bit_found = 0;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6355
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6356 detect_info.checked = detect_info.found = detect_info.rejected = 0;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6357 for (src = coding->source; src < src_end; src++)
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6358 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6359 c = *src;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6360 if (c & 0x80)
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6361 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6362 eight_bit_found = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6363 if (null_byte_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6364 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6365 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6366 else if (c < 0x20)
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6367 {
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6368 if ((c == ISO_CODE_ESC || c == ISO_CODE_SI || c == ISO_CODE_SO)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6369 && ! inhibit_iso_escape_detection
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6370 && ! detect_info.checked)
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6371 {
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6372 if (detect_coding_iso_2022 (coding, &detect_info))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6373 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6374 /* We have scanned the whole data. */
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6375 if (! (detect_info.rejected & CATEGORY_MASK_ISO_7_ELSE))
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6376 {
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6377 /* We didn't find an 8-bit code. We may
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6378 have found a null-byte, but it's very
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6379 rare that a binary file confirm to
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6380 ISO-2022. */
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6381 src = src_end;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6382 coding->head_ascii = src - coding->source;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6383 }
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6384 detect_info.rejected |= ~CATEGORY_MASK_ISO_ESCAPE;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6385 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6386 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6387 }
101040
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
6388 else if (! c && !inhibit_null_byte_detection)
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6389 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6390 null_byte_found = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6391 if (eight_bit_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6392 break;
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6393 }
95585
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
6394 if (! eight_bit_found)
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
6395 coding->head_ascii++;
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6396 }
95585
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
6397 else if (! eight_bit_found)
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6398 coding->head_ascii++;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6399 }
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6400
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6401 if (null_byte_found || eight_bit_found
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6402 || coding->head_ascii < coding->src_bytes
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6403 || detect_info.found)
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6404 {
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6405 enum coding_category category;
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6406 struct coding_system *this;
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6407
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6408 if (coding->head_ascii == coding->src_bytes)
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6409 /* As all bytes are 7-bit, we can ignore non-ISO-2022 codings. */
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6410 for (i = 0; i < coding_category_raw_text; i++)
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6411 {
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6412 category = coding_priorities[i];
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6413 this = coding_categories + category;
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6414 if (detect_info.found & (1 << category))
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6415 break;
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6416 }
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6417 else
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6418 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6419 if (null_byte_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6420 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6421 detect_info.checked |= ~CATEGORY_MASK_UTF_16;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6422 detect_info.rejected |= ~CATEGORY_MASK_UTF_16;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6423 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6424 for (i = 0; i < coding_category_raw_text; i++)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6425 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6426 category = coding_priorities[i];
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6427 this = coding_categories + category;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6428 if (this->id < 0)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6429 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6430 /* No coding system of this category is defined. */
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6431 detect_info.rejected |= (1 << category);
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6432 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6433 else if (category >= coding_category_raw_text)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6434 continue;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6435 else if (detect_info.checked & (1 << category))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6436 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6437 if (detect_info.found & (1 << category))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6438 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6439 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6440 else if ((*(this->detector)) (coding, &detect_info)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6441 && detect_info.found & (1 << category))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6442 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6443 if (category == coding_category_utf_16_auto)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6444 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6445 if (detect_info.found & CATEGORY_MASK_UTF_16_LE)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6446 category = coding_category_utf_16_le;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6447 else
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6448 category = coding_category_utf_16_be;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6449 }
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
6450 break;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6451 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6452 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
6453 }
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6454
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6455 if (i < coding_category_raw_text)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6456 setup_coding_system (CODING_ID_NAME (this->id), coding);
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6457 else if (null_byte_found)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6458 setup_coding_system (Qno_conversion, coding);
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6459 else if ((detect_info.rejected & CATEGORY_MASK_ANY)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6460 == CATEGORY_MASK_ANY)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6461 setup_coding_system (Qraw_text, coding);
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6462 else if (detect_info.rejected)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6463 for (i = 0; i < coding_category_raw_text; i++)
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6464 if (! (detect_info.rejected & (1 << coding_priorities[i])))
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6465 {
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6466 this = coding_categories + coding_priorities[i];
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6467 setup_coding_system (CODING_ID_NAME (this->id), coding);
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6468 break;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
6469 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6470 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6471 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6472 else if (XINT (CODING_ATTR_CATEGORY (CODING_ID_ATTRS (coding->id)))
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6473 == coding_category_utf_8_auto)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6474 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6475 Lisp_Object coding_systems;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6476 struct coding_detection_info detect_info;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6477
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6478 coding_systems
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6479 = AREF (CODING_ID_ATTRS (coding->id), coding_attr_utf_bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6480 detect_info.found = detect_info.rejected = 0;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6481 coding->head_ascii = 0;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6482 if (CONSP (coding_systems)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6483 && detect_coding_utf_8 (coding, &detect_info))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6484 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6485 if (detect_info.found & CATEGORY_MASK_UTF_8_SIG)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6486 setup_coding_system (XCAR (coding_systems), coding);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6487 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6488 setup_coding_system (XCDR (coding_systems), coding);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6489 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6490 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6491 else if (XINT (CODING_ATTR_CATEGORY (CODING_ID_ATTRS (coding->id)))
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6492 == coding_category_utf_16_auto)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6493 {
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6494 Lisp_Object coding_systems;
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6495 struct coding_detection_info detect_info;
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6496
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6497 coding_systems
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6498 = AREF (CODING_ID_ATTRS (coding->id), coding_attr_utf_bom);
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6499 detect_info.found = detect_info.rejected = 0;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
6500 coding->head_ascii = 0;
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6501 if (CONSP (coding_systems)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6502 && detect_coding_utf_16 (coding, &detect_info))
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6503 {
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6504 if (detect_info.found & CATEGORY_MASK_UTF_16_LE)
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6505 setup_coding_system (XCAR (coding_systems), coding);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6506 else if (detect_info.found & CATEGORY_MASK_UTF_16_BE)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6507 setup_coding_system (XCDR (coding_systems), coding);
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6508 }
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
6509 }
102105
a5023e8bbb1e (detect_coding): Preserve coding->mode.
Kenichi Handa <handa@m17n.org>
parents: 102058
diff changeset
6510 coding->mode = saved_mode;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6511 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6512
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6513
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6514 static void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6515 decode_eol (coding)
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6516 struct coding_system *coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6517 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6518 Lisp_Object eol_type;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6519 unsigned char *p, *pbeg, *pend;
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
6520
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6521 eol_type = CODING_ID_EOL_TYPE (coding->id);
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
6522 if (EQ (eol_type, Qunix) || inhibit_eol_conversion)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6523 return;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6524
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6525 if (NILP (coding->dst_object))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6526 pbeg = coding->destination;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6527 else
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6528 pbeg = BYTE_POS_ADDR (coding->dst_pos_byte);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6529 pend = pbeg + coding->produced;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6530
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6531 if (VECTORP (eol_type))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6532 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6533 int eol_seen = EOL_SEEN_NONE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6534
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6535 for (p = pbeg; p < pend; p++)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6536 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6537 if (*p == '\n')
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6538 eol_seen |= EOL_SEEN_LF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6539 else if (*p == '\r')
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6540 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6541 if (p + 1 < pend && *(p + 1) == '\n')
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6542 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6543 eol_seen |= EOL_SEEN_CRLF;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6544 p++;
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6545 }
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6546 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6547 eol_seen |= EOL_SEEN_CR;
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
6548 }
28022
6c41f3276340 Add comments on coding-category-utf-8,
Kenichi Handa <handa@m17n.org>
parents: 27943
diff changeset
6549 }
101678
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6550 /* Handle DOS-style EOLs in a file with stray ^M characters. */
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6551 if ((eol_seen & EOL_SEEN_CRLF) != 0
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6552 && (eol_seen & EOL_SEEN_CR) != 0
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6553 && (eol_seen & EOL_SEEN_LF) == 0)
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6554 eol_seen = EOL_SEEN_CRLF;
589af07b7af1 (detect_eol, decode_eol): Handle text with DOS-style EOLs that also has
Eli Zaretskii <eliz@gnu.org>
parents: 101197
diff changeset
6555 else if (eol_seen != EOL_SEEN_NONE
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6556 && eol_seen != EOL_SEEN_LF
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6557 && eol_seen != EOL_SEEN_CRLF
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6558 && eol_seen != EOL_SEEN_CR)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6559 eol_seen = EOL_SEEN_LF;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6560 if (eol_seen != EOL_SEEN_NONE)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6561 eol_type = adjust_coding_eol_type (coding, eol_seen);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6562 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6563
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6564 if (EQ (eol_type, Qmac))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6565 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6566 for (p = pbeg; p < pend; p++)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6567 if (*p == '\r')
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6568 *p = '\n';
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6569 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6570 else if (EQ (eol_type, Qdos))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6571 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6572 int n = 0;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6573
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6574 if (NILP (coding->dst_object))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6575 {
90378
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6576 /* Start deleting '\r' from the tail to minimize the memory
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6577 movement. */
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6578 for (p = pend - 2; p >= pbeg; p--)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6579 if (*p == '\r')
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6580 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6581 safe_bcopy ((char *) (p + 1), (char *) p, pend-- - p - 1);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6582 n++;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6583 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6584 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6585 else
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6586 {
90378
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6587 int pos_byte = coding->dst_pos_byte;
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6588 int pos = coding->dst_pos;
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6589 int pos_end = pos + coding->produced_char - 1;
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6590
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6591 while (pos < pos_end)
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6592 {
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6593 p = BYTE_POS_ADDR (pos_byte);
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6594 if (*p == '\r' && p[1] == '\n')
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6595 {
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6596 del_range_2 (pos, pos_byte, pos + 1, pos_byte + 1, 0);
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6597 n++;
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6598 pos_end--;
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6599 }
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6600 pos++;
91535
419a669bc4f2 (decode_eol): Pay attention to coding->dst_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 91367
diff changeset
6601 if (coding->dst_multibyte)
419a669bc4f2 (decode_eol): Pay attention to coding->dst_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 91367
diff changeset
6602 pos_byte += BYTES_BY_CHAR_HEAD (*p);
419a669bc4f2 (decode_eol): Pay attention to coding->dst_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 91367
diff changeset
6603 else
419a669bc4f2 (decode_eol): Pay attention to coding->dst_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 91367
diff changeset
6604 pos_byte++;
90378
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
6605 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6606 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6607 coding->produced -= n;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
6608 coding->produced_char -= n;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6609 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6610 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6611
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6612
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
6613 /* Return a translation table (or list of them) from coding system
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
6614 attribute vector ATTRS for encoding (ENCODEP is nonzero) or
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
6615 decoding (ENCODEP is zero). */
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6616
89858
23cb9ed79225 (get_translation_table): Declare it as Lisp_Object.
Kenichi Handa <handa@m17n.org>
parents: 89856
diff changeset
6617 static Lisp_Object
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6618 get_translation_table (attrs, encodep, max_lookup)
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6619 Lisp_Object attrs;
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6620 int encodep, *max_lookup;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6621 {
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6622 Lisp_Object standard, translation_table;
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6623 Lisp_Object val;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6624
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6625 if (encodep)
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6626 translation_table = CODING_ATTR_ENCODE_TBL (attrs),
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6627 standard = Vstandard_translation_table_for_encode;
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6628 else
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6629 translation_table = CODING_ATTR_DECODE_TBL (attrs),
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6630 standard = Vstandard_translation_table_for_decode;
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
6631 if (NILP (translation_table))
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6632 translation_table = standard;
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6633 else
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6634 {
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6635 if (SYMBOLP (translation_table))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6636 translation_table = Fget (translation_table, Qtranslation_table);
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6637 else if (CONSP (translation_table))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6638 {
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6639 translation_table = Fcopy_sequence (translation_table);
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6640 for (val = translation_table; CONSP (val); val = XCDR (val))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6641 if (SYMBOLP (XCAR (val)))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6642 XSETCAR (val, Fget (XCAR (val), Qtranslation_table));
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6643 }
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6644 if (CHAR_TABLE_P (standard))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6645 {
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6646 if (CONSP (translation_table))
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6647 translation_table = nconc2 (translation_table,
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6648 Fcons (standard, Qnil));
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6649 else
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6650 translation_table = Fcons (translation_table,
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6651 Fcons (standard, Qnil));
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6652 }
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6653 }
89861
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6654
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6655 if (max_lookup)
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6656 {
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6657 *max_lookup = 1;
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6658 if (CHAR_TABLE_P (translation_table)
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6659 && CHAR_TABLE_EXTRA_SLOTS (XCHAR_TABLE (translation_table)) > 1)
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6660 {
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6661 val = XCHAR_TABLE (translation_table)->extras[1];
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6662 if (NATNUMP (val) && *max_lookup < XFASTINT (val))
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6663 *max_lookup = XFASTINT (val);
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6664 }
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6665 else if (CONSP (translation_table))
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6666 {
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6667 Lisp_Object tail, val;
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6668
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6669 for (tail = translation_table; CONSP (tail); tail = XCDR (tail))
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6670 if (CHAR_TABLE_P (XCAR (tail))
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6671 && CHAR_TABLE_EXTRA_SLOTS (XCHAR_TABLE (XCAR (tail))) > 1)
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6672 {
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6673 val = XCHAR_TABLE (XCAR (tail))->extras[1];
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6674 if (NATNUMP (val) && *max_lookup < XFASTINT (val))
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6675 *max_lookup = XFASTINT (val);
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6676 }
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
6677 }
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
6678 }
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6679 return translation_table;
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6680 }
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6681
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6682 #define LOOKUP_TRANSLATION_TABLE(table, c, trans) \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6683 do { \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6684 trans = Qnil; \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6685 if (CHAR_TABLE_P (table)) \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6686 { \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6687 trans = CHAR_TABLE_REF (table, c); \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6688 if (CHARACTERP (trans)) \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6689 c = XFASTINT (trans), trans = Qnil; \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6690 } \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6691 else if (CONSP (table)) \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6692 { \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6693 Lisp_Object tail; \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6694 \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6695 for (tail = table; CONSP (tail); tail = XCDR (tail)) \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6696 if (CHAR_TABLE_P (XCAR (tail))) \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6697 { \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6698 trans = CHAR_TABLE_REF (XCAR (tail), c); \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6699 if (CHARACTERP (trans)) \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6700 c = XFASTINT (trans), trans = Qnil; \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6701 else if (! NILP (trans)) \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6702 break; \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6703 } \
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6704 } \
89858
23cb9ed79225 (get_translation_table): Declare it as Lisp_Object.
Kenichi Handa <handa@m17n.org>
parents: 89856
diff changeset
6705 } while (0)
23cb9ed79225 (get_translation_table): Declare it as Lisp_Object.
Kenichi Handa <handa@m17n.org>
parents: 89856
diff changeset
6706
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
6707
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6708 /* Return a translation of character(s) at BUF according to TRANS.
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6709 TRANS is TO-CHAR or ((FROM . TO) ...) where
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6710 FROM = [FROM-CHAR ...], TO is TO-CHAR or [TO-CHAR ...].
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6711 The return value is TO-CHAR or ([FROM-CHAR ...] . TO) if a
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6712 translation is found, and Qnil if not found..
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6713 If BUF is too short to lookup characters in FROM, return Qt. */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6714
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6715 static Lisp_Object
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6716 get_translation (trans, buf, buf_end)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6717 Lisp_Object trans;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6718 int *buf, *buf_end;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6719 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6720
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6721 if (INTEGERP (trans))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6722 return trans;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6723 for (; CONSP (trans); trans = XCDR (trans))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6724 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6725 Lisp_Object val = XCAR (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6726 Lisp_Object from = XCAR (val);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6727 int len = ASIZE (from);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6728 int i;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6729
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6730 for (i = 0; i < len; i++)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6731 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6732 if (buf + i == buf_end)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6733 return Qt;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6734 if (XINT (AREF (from, i)) != buf[i])
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6735 break;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6736 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6737 if (i == len)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6738 return val;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6739 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6740 return Qnil;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6741 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6742
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6743
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6744 static int
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6745 produce_chars (coding, translation_table, last_block)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6746 struct coding_system *coding;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6747 Lisp_Object translation_table;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6748 int last_block;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
6749 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6750 unsigned char *dst = coding->destination + coding->produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6751 unsigned char *dst_end = coding->destination + coding->dst_bytes;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6752 EMACS_INT produced;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6753 EMACS_INT produced_chars = 0;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6754 int carryover = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6755
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6756 if (! coding->chars_at_source)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6757 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6758 /* Source characters are in coding->charbuf. */
89575
59d10ebd2a0b (produce_chars): Revert last change.
Andreas Schwab <schwab@suse.de>
parents: 89571
diff changeset
6759 int *buf = coding->charbuf;
59d10ebd2a0b (produce_chars): Revert last change.
Andreas Schwab <schwab@suse.de>
parents: 89571
diff changeset
6760 int *buf_end = buf + coding->charbuf_used;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6761
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6762 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6763 {
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6764 coding_set_source (coding);
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6765 dst_end = ((unsigned char *) coding->source) + coding->consumed;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6766 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6767
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6768 while (buf < buf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6769 {
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6770 int c = *buf, i;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6771
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6772 if (c >= 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6773 {
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6774 int from_nchars = 1, to_nchars = 1;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6775 Lisp_Object trans = Qnil;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6776
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
6777 LOOKUP_TRANSLATION_TABLE (translation_table, c, trans);
89858
23cb9ed79225 (get_translation_table): Declare it as Lisp_Object.
Kenichi Handa <handa@m17n.org>
parents: 89856
diff changeset
6778 if (! NILP (trans))
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6779 {
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6780 trans = get_translation (trans, buf, buf_end);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6781 if (INTEGERP (trans))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6782 c = XINT (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6783 else if (CONSP (trans))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6784 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6785 from_nchars = ASIZE (XCAR (trans));
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6786 trans = XCDR (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6787 if (INTEGERP (trans))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6788 c = XINT (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6789 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6790 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6791 to_nchars = ASIZE (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6792 c = XINT (AREF (trans, 0));
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6793 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6794 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6795 else if (EQ (trans, Qt) && ! last_block)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6796 break;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6797 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6798
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6799 if (dst + MAX_MULTIBYTE_LENGTH * to_nchars > dst_end)
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6800 {
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6801 dst = alloc_destination (coding,
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6802 buf_end - buf
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6803 + MAX_MULTIBYTE_LENGTH * to_nchars,
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6804 dst);
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6805 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6806 {
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6807 coding_set_source (coding);
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6808 dst_end = (((unsigned char *) coding->source)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6809 + coding->consumed);
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6810 }
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6811 else
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6812 dst_end = coding->destination + coding->dst_bytes;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6813 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6814
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6815 for (i = 0; i < to_nchars; i++)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6816 {
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6817 if (i > 0)
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
6818 c = XINT (AREF (trans, i));
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6819 if (coding->dst_multibyte
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6820 || ! CHAR_BYTE8_P (c))
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6821 CHAR_STRING_ADVANCE_NO_UNIFY (c, dst);
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6822 else
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6823 *dst++ = CHAR_TO_BYTE8 (c);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6824 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6825 produced_chars += to_nchars;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6826 buf += from_nchars;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6827 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6828 else
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6829 /* This is an annotation datum. (-C) is the length. */
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6830 buf += -c;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6831 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6832 carryover = buf_end - buf;
30833
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
6833 }
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
6834 else
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
6835 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6836 /* Source characters are at coding->source. */
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
6837 const unsigned char *src = coding->source;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6838 const unsigned char *src_end = src + coding->consumed;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6839
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6840 if (EQ (coding->dst_object, coding->src_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6841 dst_end = (unsigned char *) src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6842 if (coding->src_multibyte != coding->dst_multibyte)
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6843 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6844 if (coding->src_multibyte)
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6845 {
88443
6b86cf30a0b9 (produce_chars): Set the variable `multibytep' correctly.
Kenichi Handa <handa@m17n.org>
parents: 88438
diff changeset
6846 int multibytep = 1;
100135
0e17542db552 (detect_coding_system): Initialize utf_16_le_eol to -1, val to
Kenichi Handa <handa@m17n.org>
parents: 100133
diff changeset
6847 EMACS_INT consumed_chars = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6848
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6849 while (1)
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6850 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
6851 const unsigned char *src_base = src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6852 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6853
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6854 ONE_MORE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6855 if (dst == dst_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6856 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6857 if (EQ (coding->src_object, coding->dst_object))
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6858 dst_end = (unsigned char *) src;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6859 if (dst == dst_end)
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6860 {
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6861 EMACS_INT offset = src - coding->source;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6862
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6863 dst = alloc_destination (coding, src_end - src + 1,
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6864 dst);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6865 dst_end = coding->destination + coding->dst_bytes;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6866 coding_set_source (coding);
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6867 src = coding->source + offset;
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6868 src_end = coding->source + coding->src_bytes;
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6869 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6870 dst_end = (unsigned char *) src;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6871 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6872 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6873 *dst++ = c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6874 produced_chars++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6875 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6876 no_more_source:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6877 ;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6878 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6879 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6880 while (src < src_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6881 {
88443
6b86cf30a0b9 (produce_chars): Set the variable `multibytep' correctly.
Kenichi Handa <handa@m17n.org>
parents: 88438
diff changeset
6882 int multibytep = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6883 int c = *src++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6884
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6885 if (dst >= dst_end - 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6886 {
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6887 if (EQ (coding->src_object, coding->dst_object))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
6888 dst_end = (unsigned char *) src;
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6889 if (dst >= dst_end - 1)
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6890 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6891 EMACS_INT offset = src - coding->source;
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6892 EMACS_INT more_bytes;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6893
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6894 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6895 more_bytes = ((src_end - src) / 2) + 2;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6896 else
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6897 more_bytes = src_end - src + 2;
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6898 dst = alloc_destination (coding, more_bytes, dst);
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6899 dst_end = coding->destination + coding->dst_bytes;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6900 coding_set_source (coding);
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6901 src = coding->source + offset;
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6902 src_end = coding->source + coding->src_bytes;
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6903 if (EQ (coding->src_object, coding->dst_object))
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
6904 dst_end = (unsigned char *) src;
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
6905 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6906 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6907 EMIT_ONE_BYTE (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6908 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6909 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6910 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6911 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6912 if (!EQ (coding->src_object, coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6913 {
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6914 EMACS_INT require = coding->src_bytes - coding->dst_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6915
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6916 if (require > 0)
23325
bbd06336cd0c (check_composing_code): If the current composing
Kenichi Handa <handa@m17n.org>
parents: 23315
diff changeset
6917 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6918 EMACS_INT offset = src - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6919
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6920 dst = alloc_destination (coding, require, dst);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6921 coding_set_source (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6922 src = coding->source + offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6923 src_end = coding->source + coding->src_bytes;
23325
bbd06336cd0c (check_composing_code): If the current composing
Kenichi Handa <handa@m17n.org>
parents: 23315
diff changeset
6924 }
34892
3868f2e7355a (setup_coding_system): Initialize
Kenichi Handa <handa@m17n.org>
parents: 34888
diff changeset
6925 }
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6926 produced_chars = coding->consumed_char;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6927 while (src < src_end)
92406
c36bda0a03cc (decode_coding_big5, produce_chars): Fix typos in last
Andreas Schwab <schwab@suse.de>
parents: 92399
diff changeset
6928 *dst++ = *src++;
92399
fbc07b3a6baf (decode_coding_utf_8): When eol-type of CODING is
Kenichi Handa <handa@m17n.org>
parents: 92030
diff changeset
6929 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6930 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6931
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6932 produced = dst - (coding->destination + coding->produced);
90809
3c52757d5f6e (produce_chars): Don't call insert_from_gap if no
Kenichi Handa <handa@m17n.org>
parents: 90772
diff changeset
6933 if (BUFFERP (coding->dst_object) && produced_chars > 0)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6934 insert_from_gap (produced_chars, produced);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6935 coding->produced += produced;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6936 coding->produced_char += produced_chars;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6937 return carryover;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6938 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6939
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6940 /* Compose text in CODING->object according to the annotation data at
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6941 CHARBUF. CHARBUF is an array:
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6942 [ -LENGTH ANNOTATION_MASK NCHARS NBYTES METHOD [ COMPONENTS... ] ]
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6943 */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6944
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6945 static INLINE void
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6946 produce_composition (coding, charbuf, pos)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6947 struct coding_system *coding;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6948 int *charbuf;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6949 EMACS_INT pos;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6950 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6951 int len;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6952 EMACS_INT to;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6953 enum composition_method method;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6954 Lisp_Object components;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6955
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6956 len = -charbuf[0] - MAX_ANNOTATION_LENGTH;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6957 to = pos + charbuf[2];
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6958 method = (enum composition_method) (charbuf[4]);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6959
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6960 if (method == COMPOSITION_RELATIVE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6961 components = Qnil;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6962 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6963 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
6964 Lisp_Object args[MAX_COMPOSITION_COMPONENTS * 2 - 1];
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6965 int i, j;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6966
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6967 if (method == COMPOSITION_WITH_RULE)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6968 len = charbuf[2] * 3 - 2;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6969 charbuf += MAX_ANNOTATION_LENGTH;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6970 /* charbuf = [ CHRA ... CHAR] or [ CHAR -2 RULE ... CHAR ] */
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6971 for (i = j = 0; i < len && charbuf[i] != -1; i++, j++)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6972 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6973 if (charbuf[i] >= 0)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6974 args[j] = make_number (charbuf[i]);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6975 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6976 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6977 i++;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6978 args[j] = make_number (charbuf[i] % 0x100);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6979 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6980 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6981 components = (i == j ? Fstring (j, args) : Fvector (j, args));
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
6982 }
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6983 compose_text (pos, to, components, Qnil, coding->dst_object);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6984 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
6985
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6986
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6987 /* Put `charset' property on text in CODING->object according to
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6988 the annotation data at CHARBUF. CHARBUF is an array:
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6989 [ -LENGTH ANNOTATION_MASK NCHARS CHARSET-ID ]
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6990 */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6991
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6992 static INLINE void
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6993 produce_charset (coding, charbuf, pos)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6994 struct coding_system *coding;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
6995 int *charbuf;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6996 EMACS_INT pos;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6997 {
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6998 EMACS_INT from = pos - charbuf[2];
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
6999 struct charset *charset = CHARSET_FROM_ID (charbuf[3]);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7000
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7001 Fput_text_property (make_number (from), make_number (pos),
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7002 Qcharset, CHARSET_NAME (charset),
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7003 coding->dst_object);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7004 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7005
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7006
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7007 #define CHARBUF_SIZE 0x4000
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7008
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7009 #define ALLOC_CONVERSION_WORK_AREA(coding) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7010 do { \
101943
97c9e9322753 Remove spurious semicolons.
Juanma Barranquero <lekktu@gmail.com>
parents: 101904
diff changeset
7011 int size = CHARBUF_SIZE; \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7012 \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7013 coding->charbuf = NULL; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7014 while (size > 1024) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7015 { \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7016 coding->charbuf = (int *) alloca (sizeof (int) * size); \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7017 if (coding->charbuf) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7018 break; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7019 size >>= 1; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7020 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7021 if (! coding->charbuf) \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7022 { \
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7023 record_conversion_result (coding, CODING_RESULT_INSUFFICIENT_MEM); \
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7024 return coding->result; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7025 } \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7026 coding->charbuf_size = size; \
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7027 } while (0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7028
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7029
30833
2db6e42a6ba3 (MINIMUM_CONVERSION_BUFFER_SIZE): Macro deleted.
Kenichi Handa <handa@m17n.org>
parents: 30756
diff changeset
7030 static void
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7031 produce_annotation (coding, pos)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7032 struct coding_system *coding;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7033 EMACS_INT pos;
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
7034 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7035 int *charbuf = coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7036 int *charbuf_end = charbuf + coding->charbuf_used;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7037
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7038 if (NILP (coding->dst_object))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7039 return;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7040
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7041 while (charbuf < charbuf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7042 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7043 if (*charbuf >= 0)
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7044 pos++, charbuf++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7045 else
29877
7b43e1fb478a (decode_eol_post_ccl): Special handling for undecided
Eli Zaretskii <eliz@gnu.org>
parents: 29725
diff changeset
7046 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7047 int len = -*charbuf;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7048
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7049 if (len > 2)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7050 switch (charbuf[1])
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7051 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7052 case CODING_ANNOTATE_COMPOSITION_MASK:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7053 produce_composition (coding, charbuf, pos);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7054 break;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7055 case CODING_ANNOTATE_CHARSET_MASK:
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7056 produce_charset (coding, charbuf, pos);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7057 break;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7058 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7059 charbuf += len;
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
7060 }
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
7061 }
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
7062 }
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
7063
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7064 /* Decode the data at CODING->src_object into CODING->dst_object.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7065 CODING->src_object is a buffer, a string, or nil.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7066 CODING->dst_object is a buffer.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7067
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7068 If CODING->src_object is a buffer, it must be the current buffer.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7069 In this case, if CODING->src_pos is positive, it is a position of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7070 the source text in the buffer, otherwise, the source text is in the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7071 gap area of the buffer, and CODING->src_pos specifies the offset of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7072 the text from GPT (which must be the same as PT). If this is the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7073 same buffer as CODING->dst_object, CODING->src_pos must be
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7074 negative.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7075
90380
4bf7966e0788 (decode_coding): Typo in comment fixed.
Kenichi Handa <handa@m17n.org>
parents: 90378
diff changeset
7076 If CODING->src_object is a string, CODING->src_pos is an index to
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7077 that string.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7078
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7079 If CODING->src_object is nil, CODING->source must already point to
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7080 the non-relocatable memory area. In this case, CODING->src_pos is
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7081 an offset from CODING->source.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7082
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7083 The decoded data is inserted at the current point of the buffer
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7084 CODING->dst_object.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7085 */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7086
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7087 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7088 decode_coding (coding)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7089 struct coding_system *coding;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7090 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7091 Lisp_Object attrs;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7092 Lisp_Object undo_list;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
7093 Lisp_Object translation_table;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7094 int carryover;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7095 int i;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7096
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7097 if (BUFFERP (coding->src_object)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7098 && coding->src_pos > 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7099 && coding->src_pos < GPT
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7100 && coding->src_pos + coding->src_chars > GPT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7101 move_gap_both (coding->src_pos, coding->src_pos_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7102
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7103 undo_list = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7104 if (BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7105 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7106 if (current_buffer != XBUFFER (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7107 set_buffer_internal (XBUFFER (coding->dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7108 if (GPT != PT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7109 move_gap_both (PT, PT_BYTE);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7110 undo_list = current_buffer->undo_list;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7111 current_buffer->undo_list = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7112 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7113
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7114 coding->consumed = coding->consumed_char = 0;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
7115 coding->produced = coding->produced_char = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7116 coding->chars_at_source = 0;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7117 record_conversion_result (coding, CODING_RESULT_SUCCESS);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
7118 coding->errors = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7119
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7120 ALLOC_CONVERSION_WORK_AREA (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7121
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7122 attrs = CODING_ID_ATTRS (coding->id);
89861
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
7123 translation_table = get_translation_table (attrs, 0, NULL);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7124
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7125 carryover = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7126 do
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7127 {
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7128 EMACS_INT pos = coding->dst_pos + coding->produced_char;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7129
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7130 coding_set_source (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7131 coding->annotated = 0;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7132 coding->charbuf_used = carryover;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7133 (*(coding->decoder)) (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7134 coding_set_destination (coding);
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7135 carryover = produce_chars (coding, translation_table, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7136 if (coding->annotated)
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7137 produce_annotation (coding, pos);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7138 for (i = 0; i < carryover; i++)
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7139 coding->charbuf[i]
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7140 = coding->charbuf[coding->charbuf_used - carryover + i];
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7141 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7142 while (coding->consumed < coding->src_bytes
90336
f0338dbf2276 (decode_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 90327
diff changeset
7143 && (coding->result == CODING_RESULT_SUCCESS
f0338dbf2276 (decode_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 90327
diff changeset
7144 || coding->result == CODING_RESULT_INVALID_SRC));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7145
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7146 if (carryover > 0)
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7147 {
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7148 coding_set_destination (coding);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7149 coding->charbuf_used = carryover;
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7150 produce_chars (coding, translation_table, 1);
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7151 }
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7152
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7153 coding->carryover_bytes = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7154 if (coding->consumed < coding->src_bytes)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7155 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7156 int nbytes = coding->src_bytes - coding->consumed;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
7157 const unsigned char *src;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7158
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7159 coding_set_source (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7160 coding_set_destination (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7161 src = coding->source + coding->consumed;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7162
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7163 if (coding->mode & CODING_MODE_LAST_BLOCK)
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
7164 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7165 /* Flush out unprocessed data as binary chars. We are sure
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7166 that the number of data is less than the size of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7167 coding->charbuf. */
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7168 coding->charbuf_used = 0;
100587
d91e3320dd81 (decode_coding): Clear chars_at_source flag when using charbuf.
Jason Rumney <jasonr@gnu.org>
parents: 100303
diff changeset
7169 coding->chars_at_source = 0;
d91e3320dd81 (decode_coding): Clear chars_at_source flag when using charbuf.
Jason Rumney <jasonr@gnu.org>
parents: 100303
diff changeset
7170
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7171 while (nbytes-- > 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7172 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7173 int c = *src++;
89279
1fd77c471ee6 (decode_coding_utf_8): When eol_type is Qdos, handle
Kenichi Handa <handa@m17n.org>
parents: 89227
diff changeset
7174
90243
c59afb15f5c6 (decode_coding): Fix handling of invalid bytes.
Kenichi Handa <handa@m17n.org>
parents: 90231
diff changeset
7175 if (c & 0x80)
c59afb15f5c6 (decode_coding): Fix handling of invalid bytes.
Kenichi Handa <handa@m17n.org>
parents: 90231
diff changeset
7176 c = BYTE8_TO_CHAR (c);
c59afb15f5c6 (decode_coding): Fix handling of invalid bytes.
Kenichi Handa <handa@m17n.org>
parents: 90231
diff changeset
7177 coding->charbuf[coding->charbuf_used++] = c;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7178 }
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
7179 produce_chars (coding, Qnil, 1);
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
7180 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7181 else
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7182 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7183 /* Record unprocessed bytes in coding->carryover. We are
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7184 sure that the number of data is less than the size of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7185 coding->carryover. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7186 unsigned char *p = coding->carryover;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7187
102115
db1f94e25359 (detect_coding): Don't overflow coding->carryover.
Kenichi Handa <handa@m17n.org>
parents: 102105
diff changeset
7188 if (nbytes > sizeof coding->carryover)
db1f94e25359 (detect_coding): Don't overflow coding->carryover.
Kenichi Handa <handa@m17n.org>
parents: 102105
diff changeset
7189 nbytes = sizeof coding->carryover;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7190 coding->carryover_bytes = nbytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7191 while (nbytes-- > 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7192 *p++ = *src++;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7193 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7194 coding->consumed = coding->src_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7195 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7196
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
7197 if (! EQ (CODING_ID_EOL_TYPE (coding->id), Qunix)
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
7198 && !inhibit_eol_conversion)
90378
0aec08f4c729 (decode_eol): Pay attention to buffer relocation in
Kenichi Handa <handa@m17n.org>
parents: 90363
diff changeset
7199 decode_eol (coding);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7200 if (BUFFERP (coding->dst_object))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7201 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7202 current_buffer->undo_list = undo_list;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7203 record_insert (coding->dst_pos, coding->produced_char);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7204 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
7205 return coding->result;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7206 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7207
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7208
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
7209 /* Extract an annotation datum from a composition starting at POS and
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7210 ending before LIMIT of CODING->src_object (buffer or string), store
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7211 the data in BUF, set *STOP to a starting position of the next
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7212 composition (if any) or to LIMIT, and return the address of the
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7213 next element of BUF.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7214
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7215 If such an annotation is not found, set *STOP to a starting
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7216 position of a composition after POS (if any) or to LIMIT, and
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7217 return BUF. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7218
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7219 static INLINE int *
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7220 handle_composition_annotation (pos, limit, coding, buf, stop)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7221 EMACS_INT pos, limit;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7222 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7223 int *buf;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7224 EMACS_INT *stop;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7225 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7226 EMACS_INT start, end;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7227 Lisp_Object prop;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7228
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7229 if (! find_composition (pos, limit, &start, &end, &prop, coding->src_object)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7230 || end > limit)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7231 *stop = limit;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7232 else if (start > pos)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7233 *stop = start;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7234 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7235 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7236 if (start == pos)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7237 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7238 /* We found a composition. Store the corresponding
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7239 annotation data in BUF. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7240 int *head = buf;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7241 enum composition_method method = COMPOSITION_METHOD (prop);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7242 int nchars = COMPOSITION_LENGTH (prop);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7243
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7244 ADD_COMPOSITION_DATA (buf, nchars, 0, method);
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7245 if (method != COMPOSITION_RELATIVE)
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7246 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7247 Lisp_Object components;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7248 int len, i, i_byte;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7249
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7250 components = COMPOSITION_COMPONENTS (prop);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7251 if (VECTORP (components))
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7252 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7253 len = XVECTOR (components)->size;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7254 for (i = 0; i < len; i++)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7255 *buf++ = XINT (AREF (components, i));
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7256 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7257 else if (STRINGP (components))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7258 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
7259 len = SCHARS (components);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7260 i = i_byte = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7261 while (i < len)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7262 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7263 FETCH_STRING_CHAR_ADVANCE (*buf, components, i, i_byte);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7264 buf++;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7265 }
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7266 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7267 else if (INTEGERP (components))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7268 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7269 len = 1;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7270 *buf++ = XINT (components);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7271 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7272 else if (CONSP (components))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7273 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7274 for (len = 0; CONSP (components);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7275 len++, components = XCDR (components))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7276 *buf++ = XINT (XCAR (components));
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7277 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7278 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7279 abort ();
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7280 *head -= len;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7281 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7282 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7283
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7284 if (find_composition (end, limit, &start, &end, &prop,
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7285 coding->src_object)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7286 && end <= limit)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7287 *stop = start;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7288 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7289 *stop = limit;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7290 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7291 return buf;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7292 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7293
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7294
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
7295 /* Extract an annotation datum from a text property `charset' at POS of
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7296 CODING->src_object (buffer of string), store the data in BUF, set
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7297 *STOP to the position where the value of `charset' property changes
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7298 (limiting by LIMIT), and return the address of the next element of
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7299 BUF.
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7300
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7301 If the property value is nil, set *STOP to the position where the
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7302 property value is non-nil (limiting by LIMIT), and return BUF. */
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7303
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7304 static INLINE int *
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7305 handle_charset_annotation (pos, limit, coding, buf, stop)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7306 EMACS_INT pos, limit;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7307 struct coding_system *coding;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7308 int *buf;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7309 EMACS_INT *stop;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7310 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7311 Lisp_Object val, next;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7312 int id;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7313
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7314 val = Fget_text_property (make_number (pos), Qcharset, coding->src_object);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7315 if (! NILP (val) && CHARSETP (val))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7316 id = XINT (CHARSET_SYMBOL_ID (val));
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7317 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7318 id = -1;
89852
b636ae1109c6 (MAX_ANNOTATION_LENGTH): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 89851
diff changeset
7319 ADD_CHARSET_DATA (buf, 0, id);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7320 next = Fnext_single_property_change (make_number (pos), Qcharset,
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7321 coding->src_object,
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7322 make_number (limit));
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7323 *stop = XINT (next);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7324 return buf;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7325 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7326
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7327
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7328 static void
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
7329 consume_chars (coding, translation_table, max_lookup)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7330 struct coding_system *coding;
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7331 Lisp_Object translation_table;
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
7332 int max_lookup;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7333 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7334 int *buf = coding->charbuf;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7335 int *buf_end = coding->charbuf + coding->charbuf_size;
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
7336 const unsigned char *src = coding->source + coding->consumed;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7337 const unsigned char *src_end = coding->source + coding->src_bytes;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7338 EMACS_INT pos = coding->src_pos + coding->consumed_char;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7339 EMACS_INT end_pos = coding->src_pos + coding->src_chars;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7340 int multibytep = coding->src_multibyte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7341 Lisp_Object eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7342 int c;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7343 EMACS_INT stop, stop_composition, stop_charset;
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
7344 int *lookup_buf = NULL;
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7345
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7346 if (! NILP (translation_table))
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
7347 lookup_buf = alloca (sizeof (int) * max_lookup);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7348
102334
7baaea85626e (decode_coding_utf_8, decode_coding_utf_16, decode_coding_emacs_mule,
Eli Zaretskii <eliz@gnu.org>
parents: 102327
diff changeset
7349 eol_type = inhibit_eol_conversion ? Qunix : CODING_ID_EOL_TYPE (coding->id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7350 if (VECTORP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7351 eol_type = Qunix;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7352
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7353 /* Note: composition handling is not yet implemented. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7354 coding->common_flags &= ~CODING_ANNOTATE_COMPOSITION_MASK;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7355
89562
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7356 if (NILP (coding->src_object))
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7357 stop = stop_composition = stop_charset = end_pos;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7358 else
89562
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7359 {
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7360 if (coding->common_flags & CODING_ANNOTATE_COMPOSITION_MASK)
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7361 stop = stop_composition = pos;
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7362 else
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7363 stop = stop_composition = end_pos;
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7364 if (coding->common_flags & CODING_ANNOTATE_CHARSET_MASK)
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7365 stop = stop_charset = pos;
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7366 else
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7367 stop_charset = end_pos;
12fbcfebb9ad (consume_chars): If coding->src_object is nil, don't check annotation.
Kenichi Handa <handa@m17n.org>
parents: 89545
diff changeset
7368 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7369
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7370 /* Compensate for CRLF and conversion. */
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7371 buf_end -= 1 + MAX_ANNOTATION_LENGTH;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7372 while (buf < buf_end)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7373 {
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7374 Lisp_Object trans;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7375
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7376 if (pos == stop)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7377 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7378 if (pos == end_pos)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7379 break;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7380 if (pos == stop_composition)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7381 buf = handle_composition_annotation (pos, end_pos, coding,
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7382 buf, &stop_composition);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7383 if (pos == stop_charset)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7384 buf = handle_charset_annotation (pos, end_pos, coding,
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7385 buf, &stop_charset);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7386 stop = (stop_composition < stop_charset
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7387 ? stop_composition : stop_charset);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7388 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7389
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7390 if (! multibytep)
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7391 {
89462
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
7392 EMACS_INT bytes;
4e359ebf3984 (decode_coding_iso_2022): Fix handling of invalid
Kenichi Handa <handa@m17n.org>
parents: 89448
diff changeset
7393
89933
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
7394 if (coding->encoder == encode_coding_raw_text)
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
7395 c = *src++, pos++;
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
7396 else if ((bytes = MULTIBYTE_LENGTH (src, src_end)) > 0)
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
7397 c = STRING_CHAR_ADVANCE_NO_UNIFY (src), pos += bytes;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7398 else
89917
1763eef5ad02 (encode_coding_utf_8): Fix handling of raw-byte char.
Kenichi Handa <handa@m17n.org>
parents: 89905
diff changeset
7399 c = BYTE8_TO_CHAR (*src), src++, pos++;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7400 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7401 else
92992
49c4ea77b83a (CHAR_STRING_ADVANCE_NO_UNIFY)
Kenichi Handa <handa@m17n.org>
parents: 92458
diff changeset
7402 c = STRING_CHAR_ADVANCE_NO_UNIFY (src), pos++;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7403 if ((c == '\r') && (coding->mode & CODING_MODE_SELECTIVE_DISPLAY))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7404 c = '\n';
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7405 if (! EQ (eol_type, Qunix))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7406 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7407 if (c == '\n')
32443
57fa108c491f (code_convert_region): Be sure to initialize coding->category_idx.
Kenichi Handa <handa@m17n.org>
parents: 31458
diff changeset
7408 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7409 if (EQ (eol_type, Qdos))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7410 *buf++ = '\r';
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7411 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7412 c = '\r';
32443
57fa108c491f (code_convert_region): Be sure to initialize coding->category_idx.
Kenichi Handa <handa@m17n.org>
parents: 31458
diff changeset
7413 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7414 }
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7415
89858
23cb9ed79225 (get_translation_table): Declare it as Lisp_Object.
Kenichi Handa <handa@m17n.org>
parents: 89856
diff changeset
7416 trans = Qnil;
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
7417 LOOKUP_TRANSLATION_TABLE (translation_table, c, trans);
89858
23cb9ed79225 (get_translation_table): Declare it as Lisp_Object.
Kenichi Handa <handa@m17n.org>
parents: 89856
diff changeset
7418 if (NILP (trans))
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7419 *buf++ = c;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7420 else
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7421 {
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7422 int from_nchars = 1, to_nchars = 1;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7423 int *lookup_buf_end;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7424 const unsigned char *p = src;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7425 int i;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7426
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7427 lookup_buf[0] = c;
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7428 for (i = 1; i < max_lookup && p < src_end; i++)
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7429 lookup_buf[i] = STRING_CHAR_ADVANCE (p);
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7430 lookup_buf_end = lookup_buf + i;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7431 trans = get_translation (trans, lookup_buf, lookup_buf_end);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7432 if (INTEGERP (trans))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7433 c = XINT (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7434 else if (CONSP (trans))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7435 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7436 from_nchars = ASIZE (XCAR (trans));
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7437 trans = XCDR (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7438 if (INTEGERP (trans))
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7439 c = XINT (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7440 else
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7441 {
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7442 to_nchars = ASIZE (trans);
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7443 if (buf + to_nchars > buf_end)
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7444 break;
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7445 c = XINT (AREF (trans, 0));
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7446 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7447 }
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7448 else
23881
20d595402dea (DECODE_DESIGNATION): Jump to label_invalid_code if
Kenichi Handa <handa@m17n.org>
parents: 23564
diff changeset
7449 break;
102422
82f82b92314e (CODING_ISO_CMP_STATUS): New macro.
Kenichi Handa <handa@m17n.org>
parents: 102334
diff changeset
7450 *buf++ = c;
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7451 for (i = 1; i < to_nchars; i++)
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7452 *buf++ = XINT (AREF (trans, i));
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7453 for (i = 1; i < from_nchars; i++, pos++)
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7454 src += MULTIBYTE_LENGTH_NO_CHECK (src);
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
7455 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7456 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7457
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7458 coding->consumed = src - coding->source;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7459 coding->consumed_char = pos - coding->src_pos;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7460 coding->charbuf_used = buf - coding->charbuf;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7461 coding->chars_at_source = 0;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7462 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7463
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7464
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7465 /* Encode the text at CODING->src_object into CODING->dst_object.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7466 CODING->src_object is a buffer or a string.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7467 CODING->dst_object is a buffer or nil.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7468
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7469 If CODING->src_object is a buffer, it must be the current buffer.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7470 In this case, if CODING->src_pos is positive, it is a position of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7471 the source text in the buffer, otherwise. the source text is in the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7472 gap area of the buffer, and coding->src_pos specifies the offset of
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7473 the text from GPT (which must be the same as PT). If this is the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7474 same buffer as CODING->dst_object, CODING->src_pos must be
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7475 negative and CODING should not have `pre-write-conversion'.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7476
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7477 If CODING->src_object is a string, CODING should not have
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7478 `pre-write-conversion'.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7479
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7480 If CODING->dst_object is a buffer, the encoded data is inserted at
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7481 the current point of that buffer.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7482
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7483 If CODING->dst_object is nil, the encoded data is placed at the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7484 memory area specified by CODING->destination. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7485
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7486 static int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7487 encode_coding (coding)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7488 struct coding_system *coding;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7489 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7490 Lisp_Object attrs;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
7491 Lisp_Object translation_table;
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
7492 int max_lookup;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7493
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7494 attrs = CODING_ID_ATTRS (coding->id);
89933
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
7495 if (coding->encoder == encode_coding_raw_text)
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
7496 translation_table = Qnil, max_lookup = 0;
42661
e85e4d9494b1 (code_convert_region): Don't copy old text if undo disabled.
Richard M. Stallman <rms@gnu.org>
parents: 42105
diff changeset
7497 else
89933
48af0ea7d387 (setup_coding_system): Set coding->common_flags
Kenichi Handa <handa@m17n.org>
parents: 89924
diff changeset
7498 translation_table = get_translation_table (attrs, 1, &max_lookup);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7499
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7500 if (BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7501 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7502 set_buffer_internal (XBUFFER (coding->dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7503 coding->dst_multibyte
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7504 = ! NILP (current_buffer->enable_multibyte_characters);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7505 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7506
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7507 coding->consumed = coding->consumed_char = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7508 coding->produced = coding->produced_char = 0;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7509 record_conversion_result (coding, CODING_RESULT_SUCCESS);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7510 coding->errors = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7511
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7512 ALLOC_CONVERSION_WORK_AREA (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7513
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7514 do {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7515 coding_set_source (coding);
89859
b706c5ee6492 (get_translation_table): New arg max_lookup. Caller changed.
Kenichi Handa <handa@m17n.org>
parents: 89858
diff changeset
7516 consume_chars (coding, translation_table, max_lookup);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7517 coding_set_destination (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7518 (*(coding->encoder)) (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7519 } while (coding->consumed_char < coding->src_chars);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7520
90809
3c52757d5f6e (produce_chars): Don't call insert_from_gap if no
Kenichi Handa <handa@m17n.org>
parents: 90772
diff changeset
7521 if (BUFFERP (coding->dst_object) && coding->produced_char > 0)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7522 insert_from_gap (coding->produced_char, coding->produced);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7523
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7524 return (coding->result);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7525 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7526
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7527
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7528 /* Name (or base name) of work buffer for code conversion. */
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7529 static Lisp_Object Vcode_conversion_workbuf_name;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7530
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7531 /* A working buffer used by the top level conversion. Once it is
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7532 created, it is never destroyed. It has the name
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7533 Vcode_conversion_workbuf_name. The other working buffers are
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7534 destroyed after the use is finished, and their names are modified
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7535 versions of Vcode_conversion_workbuf_name. */
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7536 static Lisp_Object Vcode_conversion_reused_workbuf;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7537
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7538 /* 1 iff Vcode_conversion_reused_workbuf is already in use. */
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7539 static int reused_workbuf_in_use;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7540
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7541
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7542 /* Return a working buffer of code convesion. MULTIBYTE specifies the
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7543 multibyteness of returning buffer. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7544
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
7545 static Lisp_Object
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7546 make_conversion_work_buffer (multibyte)
89863
428fc37b2ae6 Add many prototypes for static functions.
Kenichi Handa <handa@m17n.org>
parents: 89861
diff changeset
7547 int multibyte;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7548 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7549 Lisp_Object name, workbuf;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7550 struct buffer *current;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7551
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7552 if (reused_workbuf_in_use++)
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7553 {
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7554 name = Fgenerate_new_buffer_name (Vcode_conversion_workbuf_name, Qnil);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7555 workbuf = Fget_buffer_create (name);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7556 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7557 else
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7558 {
99074
10cd979d05ca (make_conversion_work_buffer): Check that Vcode_conversion_reused_workbuf
Noah Friedman <friedman@splode.com>
parents: 98992
diff changeset
7559 if (NILP (Fbuffer_live_p (Vcode_conversion_reused_workbuf)))
98186
1cfa973fde14 (make_conversion_work_buffer): Avoid calling
Kenichi Handa <handa@m17n.org>
parents: 96571
diff changeset
7560 Vcode_conversion_reused_workbuf
1cfa973fde14 (make_conversion_work_buffer): Avoid calling
Kenichi Handa <handa@m17n.org>
parents: 96571
diff changeset
7561 = Fget_buffer_create (Vcode_conversion_workbuf_name);
1cfa973fde14 (make_conversion_work_buffer): Avoid calling
Kenichi Handa <handa@m17n.org>
parents: 96571
diff changeset
7562 workbuf = Vcode_conversion_reused_workbuf;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7563 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7564 current = current_buffer;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7565 set_buffer_internal (XBUFFER (workbuf));
100262
46114a72fb0e (make_conversion_work_buffer): Disable buffer modification hooks in
Chong Yidong <cyd@stupidchicken.com>
parents: 100176
diff changeset
7566 /* We can't allow modification hooks to run in the work buffer. For
46114a72fb0e (make_conversion_work_buffer): Disable buffer modification hooks in
Chong Yidong <cyd@stupidchicken.com>
parents: 100176
diff changeset
7567 instance, directory_files_internal assumes that file decoding
46114a72fb0e (make_conversion_work_buffer): Disable buffer modification hooks in
Chong Yidong <cyd@stupidchicken.com>
parents: 100176
diff changeset
7568 doesn't compile new regexps. */
46114a72fb0e (make_conversion_work_buffer): Disable buffer modification hooks in
Chong Yidong <cyd@stupidchicken.com>
parents: 100176
diff changeset
7569 Fset (Fmake_local_variable (Qinhibit_modification_hooks), Qt);
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
7570 Ferase_buffer ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7571 current_buffer->undo_list = Qt;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7572 current_buffer->enable_multibyte_characters = multibyte ? Qt : Qnil;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7573 set_buffer_internal (current);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7574 return workbuf;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7575 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7576
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7577
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7578 static Lisp_Object
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7579 code_conversion_restore (arg)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7580 Lisp_Object arg;
26067
f54ca66e2571 (code_convert_string): Add record_unwind_protect to
Kenichi Handa <handa@m17n.org>
parents: 25860
diff changeset
7581 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7582 Lisp_Object current, workbuf;
90263
80fb4c061e99 (code_conversion_restore): GCPRO arg.
Kenichi Handa <handa@m17n.org>
parents: 90261
diff changeset
7583 struct gcpro gcpro1;
80fb4c061e99 (code_conversion_restore): GCPRO arg.
Kenichi Handa <handa@m17n.org>
parents: 90261
diff changeset
7584
80fb4c061e99 (code_conversion_restore): GCPRO arg.
Kenichi Handa <handa@m17n.org>
parents: 90261
diff changeset
7585 GCPRO1 (arg);
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7586 current = XCAR (arg);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7587 workbuf = XCDR (arg);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7588 if (! NILP (workbuf))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7589 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7590 if (EQ (workbuf, Vcode_conversion_reused_workbuf))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7591 reused_workbuf_in_use = 0;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7592 else if (! NILP (Fbuffer_live_p (workbuf)))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7593 Fkill_buffer (workbuf);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7594 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7595 set_buffer_internal (XBUFFER (current));
90263
80fb4c061e99 (code_conversion_restore): GCPRO arg.
Kenichi Handa <handa@m17n.org>
parents: 90261
diff changeset
7596 UNGCPRO;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7597 return Qnil;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7598 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7599
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7600 Lisp_Object
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7601 code_conversion_save (with_work_buf, multibyte)
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7602 int with_work_buf, multibyte;
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7603 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7604 Lisp_Object workbuf = Qnil;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7605
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7606 if (with_work_buf)
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7607 workbuf = make_conversion_work_buffer (multibyte);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7608 record_unwind_protect (code_conversion_restore,
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7609 Fcons (Fcurrent_buffer (), workbuf));
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7610 return workbuf;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7611 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
7612
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7613 int
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7614 decode_coding_gap (coding, chars, bytes)
29725
2bc397e9b09a (setup_coding_system) <4>: Reset member `cr_carryover'.
Kenichi Handa <handa@m17n.org>
parents: 29663
diff changeset
7615 struct coding_system *coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7616 EMACS_INT chars, bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7617 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7618 int count = specpdl_ptr - specpdl;
89448
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7619 Lisp_Object attrs;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7620
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7621 code_conversion_save (0, 0);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7622
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7623 coding->src_object = Fcurrent_buffer ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7624 coding->src_chars = chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7625 coding->src_bytes = bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7626 coding->src_pos = -chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7627 coding->src_pos_byte = -bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7628 coding->src_multibyte = chars < bytes;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7629 coding->dst_object = coding->src_object;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7630 coding->dst_pos = PT;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7631 coding->dst_pos_byte = PT_BYTE;
88443
6b86cf30a0b9 (produce_chars): Set the variable `multibytep' correctly.
Kenichi Handa <handa@m17n.org>
parents: 88438
diff changeset
7632 coding->dst_multibyte = ! NILP (current_buffer->enable_multibyte_characters);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7633
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7634 if (CODING_REQUIRE_DETECTION (coding))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7635 detect_coding (coding);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
7636
90350
60eaefb08cf7 (DECODE_COMPOSITION_START): If the source is short, set
Kenichi Handa <handa@m17n.org>
parents: 90346
diff changeset
7637 coding->mode |= CODING_MODE_LAST_BLOCK;
90772
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
7638 current_buffer->text->inhibit_shrinking = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7639 decode_coding (coding);
90772
b15334b4a9c3 (coding_alloc_by_making_gap): New arg offset.
Kenichi Handa <handa@m17n.org>
parents: 90737
diff changeset
7640 current_buffer->text->inhibit_shrinking = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7641
89448
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7642 attrs = CODING_ID_ATTRS (coding->id);
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7643 if (! NILP (CODING_ATTR_POST_READ (attrs)))
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7644 {
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7645 EMACS_INT prev_Z = Z, prev_Z_BYTE = Z_BYTE;
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7646 Lisp_Object val;
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7647
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7648 TEMP_SET_PT_BOTH (coding->dst_pos, coding->dst_pos_byte);
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7649 val = call1 (CODING_ATTR_POST_READ (attrs),
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7650 make_number (coding->produced_char));
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7651 CHECK_NATNUM (val);
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7652 coding->produced_char += Z - prev_Z;
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7653 coding->produced += Z_BYTE - prev_Z_BYTE;
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7654 }
de8b460070cc (setup_coding_system): If coding has
Kenichi Handa <handa@m17n.org>
parents: 89446
diff changeset
7655
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7656 unbind_to (count, Qnil);
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
7657 return coding->result;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7658 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7659
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7660 int
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7661 encode_coding_gap (coding, chars, bytes)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7662 struct coding_system *coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7663 EMACS_INT chars, bytes;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7664 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7665 int count = specpdl_ptr - specpdl;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7666
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7667 code_conversion_save (0, 0);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7668
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7669 coding->src_object = Fcurrent_buffer ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7670 coding->src_chars = chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7671 coding->src_bytes = bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7672 coding->src_pos = -chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7673 coding->src_pos_byte = -bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7674 coding->src_multibyte = chars < bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7675 coding->dst_object = coding->src_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7676 coding->dst_pos = PT;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7677 coding->dst_pos_byte = PT_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7678
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7679 encode_coding (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7680
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7681 unbind_to (count, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7682 return coding->result;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7683 }
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7684
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7685
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7686 /* Decode the text in the range FROM/FROM_BYTE and TO/TO_BYTE in
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7687 SRC_OBJECT into DST_OBJECT by coding context CODING.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7688
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7689 SRC_OBJECT is a buffer, a string, or Qnil.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7690
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7691 If it is a buffer, the text is at point of the buffer. FROM and TO
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7692 are positions in the buffer.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7693
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7694 If it is a string, the text is at the beginning of the string.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7695 FROM and TO are indices to the string.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7696
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7697 If it is nil, the text is at coding->source. FROM and TO are
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7698 indices to coding->source.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7699
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7700 DST_OBJECT is a buffer, Qt, or Qnil.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7701
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7702 If it is a buffer, the decoded text is inserted at point of the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7703 buffer. If the buffer is the same as SRC_OBJECT, the source text
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7704 is deleted.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7705
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7706 If it is Qt, a string is made from the decoded text, and
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7707 set in CODING->dst_object.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7708
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7709 If it is Qnil, the decoded text is stored at CODING->destination.
89418
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
7710 The caller must allocate CODING->dst_bytes bytes at
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7711 CODING->destination by xmalloc. If the decoded text is longer than
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7712 CODING->dst_bytes, CODING->destination is relocated by xrealloc.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7713 */
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7714
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7715 void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7716 decode_coding_object (coding, src_object, from, from_byte, to, to_byte,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7717 dst_object)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7718 struct coding_system *coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7719 Lisp_Object src_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7720 EMACS_INT from, from_byte, to, to_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7721 Lisp_Object dst_object;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7722 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7723 int count = specpdl_ptr - specpdl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7724 unsigned char *destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7725 EMACS_INT dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7726 EMACS_INT chars = to - from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7727 EMACS_INT bytes = to_byte - from_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7728 Lisp_Object attrs;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7729 int saved_pt = -1, saved_pt_byte;
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7730 int need_marker_adjustment = 0;
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7731 Lisp_Object old_deactivate_mark;
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7732
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7733 old_deactivate_mark = Vdeactivate_mark;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7734
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7735 if (NILP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7736 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7737 destination = coding->destination;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7738 dst_bytes = coding->dst_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7739 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7740
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7741 coding->src_object = src_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7742 coding->src_chars = chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7743 coding->src_bytes = bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7744 coding->src_multibyte = chars < bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7745
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7746 if (STRINGP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7747 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7748 coding->src_pos = from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7749 coding->src_pos_byte = from_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7750 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7751 else if (BUFFERP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7752 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7753 set_buffer_internal (XBUFFER (src_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7754 if (from != GPT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7755 move_gap_both (from, from_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7756 if (EQ (src_object, dst_object))
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7757 {
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7758 struct Lisp_Marker *tail;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7759
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7760 for (tail = BUF_MARKERS (current_buffer); tail; tail = tail->next)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7761 {
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7762 tail->need_adjustment
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7763 = tail->charpos == (tail->insertion_type ? from : to);
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7764 need_marker_adjustment |= tail->need_adjustment;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7765 }
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7766 saved_pt = PT, saved_pt_byte = PT_BYTE;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7767 TEMP_SET_PT_BOTH (from, from_byte);
92458
5f5f07a5c076 (decode_coding_object): Inhibit gap shrinking while
Andreas Schwab <schwab@suse.de>
parents: 92406
diff changeset
7768 current_buffer->text->inhibit_shrinking = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7769 del_range_both (from, from_byte, to, to_byte, 1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7770 coding->src_pos = -chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7771 coding->src_pos_byte = -bytes;
20931
068eb408c911 (decode_coding_iso2022): Update coding->fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents: 20803
diff changeset
7772 }
42661
e85e4d9494b1 (code_convert_region): Don't copy old text if undo disabled.
Richard M. Stallman <rms@gnu.org>
parents: 42105
diff changeset
7773 else
e85e4d9494b1 (code_convert_region): Don't copy old text if undo disabled.
Richard M. Stallman <rms@gnu.org>
parents: 42105
diff changeset
7774 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7775 coding->src_pos = from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7776 coding->src_pos_byte = from_byte;
29985
c17e78d8c720 (code_convert_region): Even if the length of text is
Kenichi Handa <handa@m17n.org>
parents: 29932
diff changeset
7777 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7778 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7779
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7780 if (CODING_REQUIRE_DETECTION (coding))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7781 detect_coding (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7782 attrs = CODING_ID_ATTRS (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7783
89418
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
7784 if (EQ (dst_object, Qt)
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
7785 || (! NILP (CODING_ATTR_POST_READ (attrs))
a9c2b3712863 (coding_set_source): Fix for the case that the current
Kenichi Handa <handa@m17n.org>
parents: 89404
diff changeset
7786 && NILP (dst_object)))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7787 {
93321
c3fe9ef79b56 (decode_coding_object): Fix last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93197
diff changeset
7788 coding->dst_multibyte = !CODING_FOR_UNIBYTE (coding);
c3fe9ef79b56 (decode_coding_object): Fix last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93197
diff changeset
7789 coding->dst_object = code_conversion_save (1, coding->dst_multibyte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7790 coding->dst_pos = BEG;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7791 coding->dst_pos_byte = BEG_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7792 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7793 else if (BUFFERP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7794 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7795 code_conversion_save (0, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7796 coding->dst_object = dst_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7797 coding->dst_pos = BUF_PT (XBUFFER (dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7798 coding->dst_pos_byte = BUF_PT_BYTE (XBUFFER (dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7799 coding->dst_multibyte
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7800 = ! NILP (XBUFFER (dst_object)->enable_multibyte_characters);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7801 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
7802 else
29172
46ad5a027334 (run_pre_post_conversion_on_str): Set point to the
Kenichi Handa <handa@m17n.org>
parents: 29093
diff changeset
7803 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7804 code_conversion_save (0, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7805 coding->dst_object = Qnil;
93322
3b82aab9d8fc (decode_coding_object): Revert part of last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93321
diff changeset
7806 /* Most callers presume this will return a multibyte result, and they
3b82aab9d8fc (decode_coding_object): Revert part of last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93321
diff changeset
7807 won't use `binary' or `raw-text' anyway, so let's not worry about
3b82aab9d8fc (decode_coding_object): Revert part of last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93321
diff changeset
7808 CODING_FOR_UNIBYTE. */
93323
06e93ffa2e9f (decode_coding_object): Fix last change.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 93322
diff changeset
7809 coding->dst_multibyte = 1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7810 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7811
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7812 decode_coding (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7813
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7814 if (BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7815 set_buffer_internal (XBUFFER (coding->dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7816
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7817 if (! NILP (CODING_ATTR_POST_READ (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7818 {
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7819 struct gcpro gcpro1, gcpro2, gcpro3, gcpro4, gcpro5;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7820 EMACS_INT prev_Z = Z, prev_Z_BYTE = Z_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7821 Lisp_Object val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7822
88506
a7f0d13affa5 (decode_coding_object): Move point to coding->dst_pos before
Kenichi Handa <handa@m17n.org>
parents: 88497
diff changeset
7823 TEMP_SET_PT_BOTH (coding->dst_pos, coding->dst_pos_byte);
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7824 GCPRO5 (coding->src_object, coding->dst_object, src_object, dst_object,
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7825 old_deactivate_mark);
90131
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7826 val = safe_call1 (CODING_ATTR_POST_READ (attrs),
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7827 make_number (coding->produced_char));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7828 UNGCPRO;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7829 CHECK_NATNUM (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7830 coding->produced_char += Z - prev_Z;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7831 coding->produced += Z_BYTE - prev_Z_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7832 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7833
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7834 if (EQ (dst_object, Qt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7835 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7836 coding->dst_object = Fbuffer_string ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7837 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7838 else if (NILP (dst_object) && BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7839 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7840 set_buffer_internal (XBUFFER (coding->dst_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7841 if (dst_bytes < coding->produced)
42105
09cc243e2d14 (code_convert_region): Update coding->cmp_data->char_offset
Richard M. Stallman <rms@gnu.org>
parents: 42104
diff changeset
7842 {
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7843 destination = xrealloc (destination, coding->produced);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7844 if (! destination)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7845 {
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7846 record_conversion_result (coding,
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7847 CODING_RESULT_INSUFFICIENT_DST);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7848 unbind_to (count, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7849 return;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7850 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7851 if (BEGV < GPT && GPT < BEGV + coding->produced_char)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7852 move_gap_both (BEGV, BEGV_BYTE);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7853 bcopy (BEGV_ADDR, destination, coding->produced);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7854 coding->destination = destination;
23279
ca159e828a68 (ccl_coding_driver): If ccl_driver is interrupted by a
Kenichi Handa <handa@m17n.org>
parents: 23258
diff changeset
7855 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7856 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7857
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7858 if (saved_pt >= 0)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7859 {
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7860 /* This is the case of:
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7861 (BUFFERP (src_object) && EQ (src_object, dst_object))
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7862 As we have moved PT while replacing the original buffer
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7863 contents, we must recover it now. */
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7864 set_buffer_internal (XBUFFER (src_object));
92458
5f5f07a5c076 (decode_coding_object): Inhibit gap shrinking while
Andreas Schwab <schwab@suse.de>
parents: 92406
diff changeset
7865 current_buffer->text->inhibit_shrinking = 0;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7866 if (saved_pt < from)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7867 TEMP_SET_PT_BOTH (saved_pt, saved_pt_byte);
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7868 else if (saved_pt < from + chars)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7869 TEMP_SET_PT_BOTH (from, from_byte);
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7870 else if (! NILP (current_buffer->enable_multibyte_characters))
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7871 TEMP_SET_PT_BOTH (saved_pt + (coding->produced_char - chars),
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7872 saved_pt_byte + (coding->produced - bytes));
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7873 else
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7874 TEMP_SET_PT_BOTH (saved_pt + (coding->produced - bytes),
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7875 saved_pt_byte + (coding->produced - bytes));
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7876
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7877 if (need_marker_adjustment)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7878 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7879 struct Lisp_Marker *tail;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7880
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7881 for (tail = BUF_MARKERS (current_buffer); tail; tail = tail->next)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7882 if (tail->need_adjustment)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7883 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7884 tail->need_adjustment = 0;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7885 if (tail->insertion_type)
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7886 {
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7887 tail->bytepos = from_byte;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7888 tail->charpos = from;
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7889 }
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7890 else
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7891 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7892 tail->bytepos = from_byte + coding->produced;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7893 tail->charpos
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7894 = (NILP (current_buffer->enable_multibyte_characters)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7895 ? tail->bytepos : from + coding->produced_char);
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7896 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7897 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7898 }
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7899 }
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7900
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7901 Vdeactivate_mark = old_deactivate_mark;
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
7902 unbind_to (count, coding->dst_object);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7903 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7904
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
7905
29275
b4ea9178e480 (DECODE_COMPOSITION_START): If coding->cmp_data is not
Kenichi Handa <handa@m17n.org>
parents: 29247
diff changeset
7906 void
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7907 encode_coding_object (coding, src_object, from, from_byte, to, to_byte,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7908 dst_object)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7909 struct coding_system *coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7910 Lisp_Object src_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7911 EMACS_INT from, from_byte, to, to_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7912 Lisp_Object dst_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7913 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7914 int count = specpdl_ptr - specpdl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7915 EMACS_INT chars = to - from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7916 EMACS_INT bytes = to_byte - from_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7917 Lisp_Object attrs;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7918 int saved_pt = -1, saved_pt_byte;
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7919 int need_marker_adjustment = 0;
90231
8be9e4c6d687 (encode_coding_object): If a pre-write-conversion
Kenichi Handa <handa@m17n.org>
parents: 90224
diff changeset
7920 int kill_src_buffer = 0;
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7921 Lisp_Object old_deactivate_mark;
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7922
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7923 old_deactivate_mark = Vdeactivate_mark;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7924
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7925 coding->src_object = src_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7926 coding->src_chars = chars;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7927 coding->src_bytes = bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7928 coding->src_multibyte = chars < bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7929
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7930 attrs = CODING_ID_ATTRS (coding->id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7931
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7932 if (EQ (src_object, dst_object))
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7933 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7934 struct Lisp_Marker *tail;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7935
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7936 for (tail = BUF_MARKERS (current_buffer); tail; tail = tail->next)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7937 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7938 tail->need_adjustment
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7939 = tail->charpos == (tail->insertion_type ? from : to);
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7940 need_marker_adjustment |= tail->need_adjustment;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7941 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7942 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
7943
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7944 if (! NILP (CODING_ATTR_PRE_WRITE (attrs)))
21062
839b22ad1e42 (code_convert_region): Handle the case that codes
Kenichi Handa <handa@m17n.org>
parents: 20999
diff changeset
7945 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7946 coding->src_object = code_conversion_save (1, coding->src_multibyte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7947 set_buffer_internal (XBUFFER (coding->src_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7948 if (STRINGP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7949 insert_from_string (src_object, from, from_byte, chars, bytes, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7950 else if (BUFFERP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7951 insert_from_buffer (XBUFFER (src_object), from, chars, 0);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
7952 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7953 insert_1_both (coding->source + from, chars, bytes, 0, 0, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7954
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7955 if (EQ (src_object, dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7956 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7957 set_buffer_internal (XBUFFER (src_object));
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7958 saved_pt = PT, saved_pt_byte = PT_BYTE;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7959 del_range_both (from, from_byte, to, to_byte, 1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7960 set_buffer_internal (XBUFFER (coding->src_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7961 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7962
90131
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7963 {
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7964 Lisp_Object args[3];
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7965 struct gcpro gcpro1, gcpro2, gcpro3, gcpro4, gcpro5;
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7966
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7967 GCPRO5 (coding->src_object, coding->dst_object, src_object, dst_object,
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7968 old_deactivate_mark);
90131
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7969 args[0] = CODING_ATTR_PRE_WRITE (attrs);
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7970 args[1] = make_number (BEG);
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7971 args[2] = make_number (Z);
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7972 safe_call (3, args);
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
7973 UNGCPRO;
90131
503a3c779486 (decode_coding_object): Use safe_call1 instead of call1.
Kenichi Handa <handa@m17n.org>
parents: 90127
diff changeset
7974 }
90231
8be9e4c6d687 (encode_coding_object): If a pre-write-conversion
Kenichi Handa <handa@m17n.org>
parents: 90224
diff changeset
7975 if (XBUFFER (coding->src_object) != current_buffer)
8be9e4c6d687 (encode_coding_object): If a pre-write-conversion
Kenichi Handa <handa@m17n.org>
parents: 90224
diff changeset
7976 kill_src_buffer = 1;
88510
d266b8fb8761 (encode_coding_object): Give correct arguments ot
Kenichi Handa <handa@m17n.org>
parents: 88506
diff changeset
7977 coding->src_object = Fcurrent_buffer ();
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7978 if (BEG != GPT)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7979 move_gap_both (BEG, BEG_BYTE);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7980 coding->src_chars = Z - BEG;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7981 coding->src_bytes = Z_BYTE - BEG_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7982 coding->src_pos = BEG;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7983 coding->src_pos_byte = BEG_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7984 coding->src_multibyte = Z < Z_BYTE;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7985 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7986 else if (STRINGP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7987 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7988 code_conversion_save (0, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7989 coding->src_pos = from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7990 coding->src_pos_byte = from_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7991 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7992 else if (BUFFERP (src_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7993 {
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
7994 code_conversion_save (0, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7995 set_buffer_internal (XBUFFER (src_object));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7996 if (EQ (src_object, dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
7997 {
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
7998 saved_pt = PT, saved_pt_byte = PT_BYTE;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
7999 coding->src_object = del_range_1 (from, to, 1, 1);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8000 coding->src_pos = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8001 coding->src_pos_byte = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8002 }
23514
7bad909cd6f1 (setup_coding_system): Fix setting up
Kenichi Handa <handa@m17n.org>
parents: 23475
diff changeset
8003 else
42105
09cc243e2d14 (code_convert_region): Update coding->cmp_data->char_offset
Richard M. Stallman <rms@gnu.org>
parents: 42104
diff changeset
8004 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8005 if (from < GPT && to >= GPT)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8006 move_gap_both (from, from_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8007 coding->src_pos = from;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8008 coding->src_pos_byte = from_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8009 }
64308
93129de4b8a4 (code_convert_region_unwind): ARG is changed to a cons.
Kenichi Handa <handa@m17n.org>
parents: 64251
diff changeset
8010 }
93129de4b8a4 (code_convert_region_unwind): ARG is changed to a cons.
Kenichi Handa <handa@m17n.org>
parents: 64251
diff changeset
8011 else
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8012 code_conversion_save (0, 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8013
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8014 if (BUFFERP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8015 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8016 coding->dst_object = dst_object;
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
8017 if (EQ (src_object, dst_object))
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
8018 {
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
8019 coding->dst_pos = from;
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
8020 coding->dst_pos_byte = from_byte;
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
8021 }
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
8022 else
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
8023 {
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8024 struct buffer *current = current_buffer;
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8025
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8026 set_buffer_temp (XBUFFER (dst_object));
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8027 coding->dst_pos = PT;
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8028 coding->dst_pos_byte = PT_BYTE;
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8029 move_gap_both (coding->dst_pos, coding->dst_pos_byte);
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
8030 set_buffer_temp (current);
89042
2b9f8973f240 (coding_set_destination): Fix coding->destination for
Kenichi Handa <handa@m17n.org>
parents: 88977
diff changeset
8031 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8032 coding->dst_multibyte
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8033 = ! NILP (XBUFFER (dst_object)->enable_multibyte_characters);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8034 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8035 else if (EQ (dst_object, Qt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8036 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8037 coding->dst_object = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8038 coding->dst_bytes = coding->src_chars;
88510
d266b8fb8761 (encode_coding_object): Give correct arguments ot
Kenichi Handa <handa@m17n.org>
parents: 88506
diff changeset
8039 if (coding->dst_bytes == 0)
d266b8fb8761 (encode_coding_object): Give correct arguments ot
Kenichi Handa <handa@m17n.org>
parents: 88506
diff changeset
8040 coding->dst_bytes = 1;
d266b8fb8761 (encode_coding_object): Give correct arguments ot
Kenichi Handa <handa@m17n.org>
parents: 88506
diff changeset
8041 coding->destination = (unsigned char *) xmalloc (coding->dst_bytes);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8042 coding->dst_multibyte = 0;
65506
f376635f5061 (code_convert_region_unwind): Argument format changed.
Kenichi Handa <handa@m17n.org>
parents: 64770
diff changeset
8043 }
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
8044 else
29172
46ad5a027334 (run_pre_post_conversion_on_str): Set point to the
Kenichi Handa <handa@m17n.org>
parents: 29093
diff changeset
8045 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8046 coding->dst_object = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8047 coding->dst_multibyte = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8048 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8049
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8050 encode_coding (coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8051
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8052 if (EQ (dst_object, Qt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8053 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8054 if (BUFFERP (coding->dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8055 coding->dst_object = Fbuffer_string ();
23514
7bad909cd6f1 (setup_coding_system): Fix setting up
Kenichi Handa <handa@m17n.org>
parents: 23475
diff changeset
8056 else
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8057 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8058 coding->dst_object
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8059 = make_unibyte_string ((char *) coding->destination,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8060 coding->produced);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8061 xfree (coding->destination);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8062 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8063 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8064
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8065 if (saved_pt >= 0)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8066 {
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8067 /* This is the case of:
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8068 (BUFFERP (src_object) && EQ (src_object, dst_object))
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8069 As we have moved PT while replacing the original buffer
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8070 contents, we must recover it now. */
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8071 set_buffer_internal (XBUFFER (src_object));
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8072 if (saved_pt < from)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8073 TEMP_SET_PT_BOTH (saved_pt, saved_pt_byte);
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8074 else if (saved_pt < from + chars)
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8075 TEMP_SET_PT_BOTH (from, from_byte);
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8076 else if (! NILP (current_buffer->enable_multibyte_characters))
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8077 TEMP_SET_PT_BOTH (saved_pt + (coding->produced_char - chars),
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8078 saved_pt_byte + (coding->produced - bytes));
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8079 else
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8080 TEMP_SET_PT_BOTH (saved_pt + (coding->produced - bytes),
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8081 saved_pt_byte + (coding->produced - bytes));
91344
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8082
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8083 if (need_marker_adjustment)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8084 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8085 struct Lisp_Marker *tail;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8086
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8087 for (tail = BUF_MARKERS (current_buffer); tail; tail = tail->next)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8088 if (tail->need_adjustment)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8089 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8090 tail->need_adjustment = 0;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8091 if (tail->insertion_type)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8092 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8093 tail->bytepos = from_byte;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8094 tail->charpos = from;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8095 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8096 else
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8097 {
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8098 tail->bytepos = from_byte + coding->produced;
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8099 tail->charpos
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8100 = (NILP (current_buffer->enable_multibyte_characters)
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8101 ? tail->bytepos : from + coding->produced_char);
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8102 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8103 }
56f3473b139e (decode_coding_object): Adjuste marker positions after
Kenichi Handa <handa@m17n.org>
parents: 91327
diff changeset
8104 }
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8105 }
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
8106
90231
8be9e4c6d687 (encode_coding_object): If a pre-write-conversion
Kenichi Handa <handa@m17n.org>
parents: 90224
diff changeset
8107 if (kill_src_buffer)
8be9e4c6d687 (encode_coding_object): If a pre-write-conversion
Kenichi Handa <handa@m17n.org>
parents: 90224
diff changeset
8108 Fkill_buffer (coding->src_object);
91838
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
8109
7bed61cbed0c (decode_coding_object, encode_coding_object): Preserve
Kenichi Handa <handa@m17n.org>
parents: 91807
diff changeset
8110 Vdeactivate_mark = old_deactivate_mark;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8111 unbind_to (count, Qnil);
58637
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
8112 }
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
8113
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
8114
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
8115 Lisp_Object
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8116 preferred_coding_system ()
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8117 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8118 int id = coding_categories[coding_priorities[0]].id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8119
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8120 return CODING_ID_NAME (id);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8121 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8122
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8123
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8124 #ifdef emacs
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
8125 /*** 8. Emacs Lisp library functions ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8126
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8127 DEFUN ("coding-system-p", Fcoding_system_p, Scoding_system_p, 1, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8128 doc: /* Return t if OBJECT is nil or a coding-system.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8129 See the documentation of `define-coding-system' for information
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8130 about coding-system objects. */)
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8131 (object)
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8132 Lisp_Object object;
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8133 {
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8134 if (NILP (object)
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8135 || CODING_SYSTEM_ID (object) >= 0)
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
8136 return Qt;
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8137 if (! SYMBOLP (object)
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8138 || NILP (Fget (object, Qcoding_system_define_form)))
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
8139 return Qnil;
90272
f1df126ec7de Sync to HEAD for handling autoload-coding-system.
Kenichi Handa <handa@m17n.org>
parents: 90263
diff changeset
8140 return Qt;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8141 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8142
17717
4891aaecc5cc (Fread_coding_system, Fread_non_nil_coding_system):
Richard M. Stallman <rms@gnu.org>
parents: 17485
diff changeset
8143 DEFUN ("read-non-nil-coding-system", Fread_non_nil_coding_system,
4891aaecc5cc (Fread_coding_system, Fread_non_nil_coding_system):
Richard M. Stallman <rms@gnu.org>
parents: 17485
diff changeset
8144 Sread_non_nil_coding_system, 1, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8145 doc: /* Read a coding system from the minibuffer, prompting with string PROMPT. */)
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8146 (prompt)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8147 Lisp_Object prompt;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8148 {
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
8149 Lisp_Object val;
17717
4891aaecc5cc (Fread_coding_system, Fread_non_nil_coding_system):
Richard M. Stallman <rms@gnu.org>
parents: 17485
diff changeset
8150 do
4891aaecc5cc (Fread_coding_system, Fread_non_nil_coding_system):
Richard M. Stallman <rms@gnu.org>
parents: 17485
diff changeset
8151 {
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
8152 val = Fcompleting_read (prompt, Vcoding_system_alist, Qnil,
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
8153 Qt, Qnil, Qcoding_system_history, Qnil, Qnil);
17717
4891aaecc5cc (Fread_coding_system, Fread_non_nil_coding_system):
Richard M. Stallman <rms@gnu.org>
parents: 17485
diff changeset
8154 }
46370
40db0673e6f0 Most uses of XSTRING combined with STRING_BYTES or indirection changed to
Ken Raeburn <raeburn@raeburn.org>
parents: 46293
diff changeset
8155 while (SCHARS (val) == 0);
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
8156 return (Fintern (val, Qnil));
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8157 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8158
19758
49a1662b68dd (Fread_coding_system): New optional arg DEFAULT_CODING_SYSTEM.
Richard M. Stallman <rms@gnu.org>
parents: 19750
diff changeset
8159 DEFUN ("read-coding-system", Fread_coding_system, Sread_coding_system, 1, 2, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8160 doc: /* Read a coding system from the minibuffer, prompting with string PROMPT.
79107
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
8161 If the user enters null input, return second argument DEFAULT-CODING-SYSTEM.
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
8162 Ignores case when completing coding systems (all Emacs coding systems
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
8163 are lower-case). */)
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8164 (prompt, default_coding_system)
19758
49a1662b68dd (Fread_coding_system): New optional arg DEFAULT_CODING_SYSTEM.
Richard M. Stallman <rms@gnu.org>
parents: 19750
diff changeset
8165 Lisp_Object prompt, default_coding_system;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8166 {
19747
bed06df9cbc5 (setup_coding_system, Ffind_operation_coding_system)
Richard M. Stallman <rms@gnu.org>
parents: 19743
diff changeset
8167 Lisp_Object val;
79107
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
8168 int count = SPECPDL_INDEX ();
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
8169
19758
49a1662b68dd (Fread_coding_system): New optional arg DEFAULT_CODING_SYSTEM.
Richard M. Stallman <rms@gnu.org>
parents: 19750
diff changeset
8170 if (SYMBOLP (default_coding_system))
45396
cab845213388 * coding.c (Fread_coding_system, code_convert_region1)
Ken Raeburn <raeburn@raeburn.org>
parents: 45239
diff changeset
8171 default_coding_system = SYMBOL_NAME (default_coding_system);
79107
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
8172 specbind (Qcompletion_ignore_case, Qt);
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
8173 val = Fcompleting_read (prompt, Vcoding_system_alist, Qnil,
19758
49a1662b68dd (Fread_coding_system): New optional arg DEFAULT_CODING_SYSTEM.
Richard M. Stallman <rms@gnu.org>
parents: 19750
diff changeset
8174 Qt, Qnil, Qcoding_system_history,
49a1662b68dd (Fread_coding_system): New optional arg DEFAULT_CODING_SYSTEM.
Richard M. Stallman <rms@gnu.org>
parents: 19750
diff changeset
8175 default_coding_system, Qnil);
79107
cce707ee192e (Qcompletion_ignore_case): New external Lisp_Object.
Glenn Morris <rgm@gnu.org>
parents: 78313
diff changeset
8176 unbind_to (count, Qnil);
46370
40db0673e6f0 Most uses of XSTRING combined with STRING_BYTES or indirection changed to
Ken Raeburn <raeburn@raeburn.org>
parents: 46293
diff changeset
8177 return (SCHARS (val) == 0 ? Qnil : Fintern (val, Qnil));
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8178 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8179
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8180 DEFUN ("check-coding-system", Fcheck_coding_system, Scheck_coding_system,
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8181 1, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8182 doc: /* Check validity of CODING-SYSTEM.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8183 If valid, return CODING-SYSTEM, else signal a `coding-system-error' error.
89892
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
8184 It is valid if it is nil or a symbol defined as a coding system by the
a2109a2c25d5 Sync to HEAD.
Kenichi Handa <handa@m17n.org>
parents: 89873
diff changeset
8185 function `define-coding-system'. */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8186 (coding_system)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8187 Lisp_Object coding_system;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8188 {
52794
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
8189 Lisp_Object define_form;
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
8190
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
8191 define_form = Fget (coding_system, Qcoding_system_define_form);
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
8192 if (! NILP (define_form))
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
8193 {
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
8194 Fput (coding_system, Qcoding_system_define_form, Qnil);
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
8195 safe_eval (define_form);
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
8196 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8197 if (!NILP (Fcoding_system_p (coding_system)))
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8198 return coding_system;
71972
eaa3c19b94d2 (Fcheck_coding_system): Use xsignal1. Remove loop.
Kim F. Storm <storm@cua.dk>
parents: 71084
diff changeset
8199 xsignal1 (Qcoding_system_error, coding_system);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8200 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8201
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8202
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8203 /* Detect how the bytes at SRC of length SRC_BYTES are encoded. If
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8204 HIGHEST is nonzero, return the coding system of the highest
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8205 priority among the detected coding systems. Otherwize return a
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8206 list of detected coding systems sorted by their priorities. If
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8207 MULTIBYTEP is nonzero, it is assumed that the bytes are in correct
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8208 multibyte form but contains only ASCII and eight-bit chars.
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8209 Otherwise, the bytes are raw bytes.
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8210
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8211 CODING-SYSTEM controls the detection as below:
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8212
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8213 If it is nil, detect both text-format and eol-format. If the
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8214 text-format part of CODING-SYSTEM is already specified
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8215 (e.g. `iso-latin-1'), detect only eol-format. If the eol-format
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8216 part of CODING-SYSTEM is already specified (e.g. `undecided-unix'),
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8217 detect only text-format. */
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8218
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8219 Lisp_Object
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8220 detect_coding_system (src, src_chars, src_bytes, highest, multibytep,
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8221 coding_system)
46548
cb1914307488 (encode_eol, detect_coding, detect_eol):
Ken Raeburn <raeburn@raeburn.org>
parents: 46462
diff changeset
8222 const unsigned char *src;
91807
507bcfb4342c * coding.c (coding_set_destination): Use BEG_BYTE rather than hardcoding 1.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 91622
diff changeset
8223 EMACS_INT src_chars, src_bytes;
507bcfb4342c * coding.c (coding_set_destination): Use BEG_BYTE rather than hardcoding 1.
Stefan Monnier <monnier@iro.umontreal.ca>
parents: 91622
diff changeset
8224 int highest;
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
8225 int multibytep;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8226 Lisp_Object coding_system;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8227 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8228 const unsigned char *src_end = src + src_bytes;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8229 Lisp_Object attrs, eol_type;
100135
0e17542db552 (detect_coding_system): Initialize utf_16_le_eol to -1, val to
Kenichi Handa <handa@m17n.org>
parents: 100133
diff changeset
8230 Lisp_Object val = Qnil;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8231 struct coding_system coding;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8232 int id;
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8233 struct coding_detection_info detect_info;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8234 enum coding_category base_category;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8235 int null_byte_found = 0, eight_bit_found = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8236
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8237 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8238 coding_system = Qundecided;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8239 setup_coding_system (coding_system, &coding);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8240 attrs = CODING_ID_ATTRS (coding.id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8241 eol_type = CODING_ID_EOL_TYPE (coding.id);
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8242 coding_system = CODING_ATTR_BASE_NAME (attrs);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8243
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8244 coding.source = src;
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8245 coding.src_chars = src_chars;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8246 coding.src_bytes = src_bytes;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8247 coding.src_multibyte = multibytep;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8248 coding.consumed = 0;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8249 coding.mode |= CODING_MODE_LAST_BLOCK;
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8250 coding.head_ascii = 0;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8251
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8252 detect_info.checked = detect_info.found = detect_info.rejected = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8253
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8254 /* At first, detect text-format if necessary. */
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8255 base_category = XINT (CODING_ATTR_CATEGORY (attrs));
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8256 if (base_category == coding_category_undecided)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8257 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8258 enum coding_category category;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8259 struct coding_system *this;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8260 int c, i;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8261
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8262 /* Skip all ASCII bytes except for a few ISO2022 controls. */
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8263 for (; src < src_end; src++)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8264 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8265 c = *src;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8266 if (c & 0x80)
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8267 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8268 eight_bit_found = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8269 if (null_byte_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8270 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8271 }
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8272 else if (c < 0x20)
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8273 {
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8274 if ((c == ISO_CODE_ESC || c == ISO_CODE_SI || c == ISO_CODE_SO)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8275 && ! inhibit_iso_escape_detection
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8276 && ! detect_info.checked)
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8277 {
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8278 if (detect_coding_iso_2022 (&coding, &detect_info))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8279 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8280 /* We have scanned the whole data. */
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8281 if (! (detect_info.rejected & CATEGORY_MASK_ISO_7_ELSE))
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8282 {
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8283 /* We didn't find an 8-bit code. We may
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8284 have found a null-byte, but it's very
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8285 rare that a binary file confirm to
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8286 ISO-2022. */
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8287 src = src_end;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8288 coding.head_ascii = src - coding.source;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8289 }
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8290 detect_info.rejected |= ~CATEGORY_MASK_ISO_ESCAPE;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8291 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8292 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8293 }
101040
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
8294 else if (! c && !inhibit_null_byte_detection)
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8295 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8296 null_byte_found = 1;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8297 if (eight_bit_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8298 break;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8299 }
95585
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
8300 if (! eight_bit_found)
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
8301 coding.head_ascii++;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8302 }
95585
862c7386145c (detect_coding): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95533
diff changeset
8303 else if (! eight_bit_found)
95533
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8304 coding.head_ascii++;
831c8ee4d884 (detect_coding): Fix handling of coding->head_ascii.
Kenichi Handa <handa@m17n.org>
parents: 95397
diff changeset
8305 }
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8306
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8307 if (null_byte_found || eight_bit_found
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8308 || coding.head_ascii < coding.src_bytes
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8309 || detect_info.found)
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8310 {
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8311 if (coding.head_ascii == coding.src_bytes)
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8312 /* As all bytes are 7-bit, we can ignore non-ISO-2022 codings. */
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8313 for (i = 0; i < coding_category_raw_text; i++)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8314 {
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8315 category = coding_priorities[i];
90594
a965377e6761 (detect_coding_system): Fix for handling off
Kenichi Handa <handa@m17n.org>
parents: 90587
diff changeset
8316 this = coding_categories + category;
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8317 if (detect_info.found & (1 << category))
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8318 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8319 }
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8320 else
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8321 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8322 if (null_byte_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8323 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8324 detect_info.checked |= ~CATEGORY_MASK_UTF_16;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8325 detect_info.rejected |= ~CATEGORY_MASK_UTF_16;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8326 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8327 for (i = 0; i < coding_category_raw_text; i++)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8328 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8329 category = coding_priorities[i];
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8330 this = coding_categories + category;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8331
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8332 if (this->id < 0)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8333 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8334 /* No coding system of this category is defined. */
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8335 detect_info.rejected |= (1 << category);
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8336 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8337 else if (category >= coding_category_raw_text)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8338 continue;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8339 else if (detect_info.checked & (1 << category))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8340 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8341 if (highest
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8342 && (detect_info.found & (1 << category)))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8343 break;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8344 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8345 else if ((*(this->detector)) (&coding, &detect_info)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8346 && highest
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8347 && (detect_info.found & (1 << category)))
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8348 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8349 if (category == coding_category_utf_16_auto)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8350 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8351 if (detect_info.found & CATEGORY_MASK_UTF_16_LE)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8352 category = coding_category_utf_16_le;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8353 else
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8354 category = coding_category_utf_16_be;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8355 }
89974
2fef8edebd5c (detect_coding_utf_16): Don't set detect_info->found if
Kenichi Handa <handa@m17n.org>
parents: 89933
diff changeset
8356 break;
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8357 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8358 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8359 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8360 }
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8361
101197
ee5f395f3c19 (detect_coding_system): Fix handling of null_byte_fount.
Kenichi Handa <handa@m17n.org>
parents: 101174
diff changeset
8362 if ((detect_info.rejected & CATEGORY_MASK_ANY) == CATEGORY_MASK_ANY
ee5f395f3c19 (detect_coding_system): Fix handling of null_byte_fount.
Kenichi Handa <handa@m17n.org>
parents: 101174
diff changeset
8363 || null_byte_found)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8364 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8365 detect_info.found = CATEGORY_MASK_RAW_TEXT;
101197
ee5f395f3c19 (detect_coding_system): Fix handling of null_byte_fount.
Kenichi Handa <handa@m17n.org>
parents: 101174
diff changeset
8366 id = CODING_SYSTEM_ID (Qno_conversion);
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8367 val = Fcons (make_number (id), Qnil);
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8368 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8369 else if (! detect_info.rejected && ! detect_info.found)
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8370 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8371 detect_info.found = CATEGORY_MASK_ANY;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8372 id = coding_categories[coding_category_undecided].id;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8373 val = Fcons (make_number (id), Qnil);
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8374 }
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8375 else if (highest)
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8376 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8377 if (detect_info.found)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8378 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8379 detect_info.found = 1 << category;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8380 val = Fcons (make_number (this->id), Qnil);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8381 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8382 else
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8383 for (i = 0; i < coding_category_raw_text; i++)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8384 if (! (detect_info.rejected & (1 << coding_priorities[i])))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8385 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8386 detect_info.found = 1 << coding_priorities[i];
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8387 id = coding_categories[coding_priorities[i]].id;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8388 val = Fcons (make_number (id), Qnil);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8389 break;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8390 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8391 }
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8392 else
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8393 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8394 int mask = detect_info.rejected | detect_info.found;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8395 int found = 0;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8396
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8397 for (i = coding_category_raw_text - 1; i >= 0; i--)
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8398 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8399 category = coding_priorities[i];
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8400 if (! (mask & (1 << category)))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8401 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8402 found |= 1 << category;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8403 id = coding_categories[category].id;
90594
a965377e6761 (detect_coding_system): Fix for handling off
Kenichi Handa <handa@m17n.org>
parents: 90587
diff changeset
8404 if (id >= 0)
a965377e6761 (detect_coding_system): Fix for handling off
Kenichi Handa <handa@m17n.org>
parents: 90587
diff changeset
8405 val = Fcons (make_number (id), val);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8406 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8407 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8408 for (i = coding_category_raw_text - 1; i >= 0; i--)
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8409 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8410 category = coding_priorities[i];
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8411 if (detect_info.found & (1 << category))
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8412 {
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8413 id = coding_categories[category].id;
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8414 val = Fcons (make_number (id), val);
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8415 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8416 }
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8417 detect_info.found |= found;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8418 }
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8419 }
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8420 else if (base_category == coding_category_utf_8_auto)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8421 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8422 if (detect_coding_utf_8 (&coding, &detect_info))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8423 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8424 struct coding_system *this;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8425
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8426 if (detect_info.found & CATEGORY_MASK_UTF_8_SIG)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8427 this = coding_categories + coding_category_utf_8_sig;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8428 else
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8429 this = coding_categories + coding_category_utf_8_nosig;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8430 val = Fcons (make_number (this->id), Qnil);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8431 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
8432 }
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8433 else if (base_category == coding_category_utf_16_auto)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8434 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8435 if (detect_coding_utf_16 (&coding, &detect_info))
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8436 {
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8437 struct coding_system *this;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8438
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8439 if (detect_info.found & CATEGORY_MASK_UTF_16_LE)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8440 this = coding_categories + coding_category_utf_16_le;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8441 else if (detect_info.found & CATEGORY_MASK_UTF_16_BE)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8442 this = coding_categories + coding_category_utf_16_be;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8443 else if (detect_info.rejected & CATEGORY_MASK_UTF_16_LE_NOSIG)
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8444 this = coding_categories + coding_category_utf_16_be_nosig;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8445 else
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8446 this = coding_categories + coding_category_utf_16_le_nosig;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8447 val = Fcons (make_number (this->id), Qnil);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8448 }
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8449 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8450 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8451 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8452 detect_info.found = 1 << XINT (CODING_ATTR_CATEGORY (attrs));
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8453 val = Fcons (make_number (coding.id), Qnil);
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8454 }
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8455
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8456 /* Then, detect eol-format if necessary. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8457 {
100135
0e17542db552 (detect_coding_system): Initialize utf_16_le_eol to -1, val to
Kenichi Handa <handa@m17n.org>
parents: 100133
diff changeset
8458 int normal_eol = -1, utf_16_be_eol = -1, utf_16_le_eol = -1;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8459 Lisp_Object tail;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8460
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8461 if (VECTORP (eol_type))
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8462 {
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8463 if (detect_info.found & ~CATEGORY_MASK_UTF_16)
93595
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8464 {
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8465 if (null_byte_found)
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8466 normal_eol = EOL_SEEN_LF;
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8467 else
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8468 normal_eol = detect_eol (coding.source, src_bytes,
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8469 coding_category_raw_text);
ac4d127a841a (CATEGORY_MASK_ANY): Add CATEGORY_MASK_UTF_16_AUTO.
Kenichi Handa <handa@m17n.org>
parents: 93323
diff changeset
8470 }
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8471 if (detect_info.found & (CATEGORY_MASK_UTF_16_BE
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8472 | CATEGORY_MASK_UTF_16_BE_NOSIG))
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8473 utf_16_be_eol = detect_eol (coding.source, src_bytes,
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8474 coding_category_utf_16_be);
89331
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8475 if (detect_info.found & (CATEGORY_MASK_UTF_16_LE
1892a75ffcac (CATEGORY_MASK_RAW_TEXT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 89279
diff changeset
8476 | CATEGORY_MASK_UTF_16_LE_NOSIG))
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8477 utf_16_le_eol = detect_eol (coding.source, src_bytes,
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8478 coding_category_utf_16_le);
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8479 }
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8480 else
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8481 {
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8482 if (EQ (eol_type, Qunix))
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8483 normal_eol = utf_16_be_eol = utf_16_le_eol = EOL_SEEN_LF;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8484 else if (EQ (eol_type, Qdos))
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8485 normal_eol = utf_16_be_eol = utf_16_le_eol = EOL_SEEN_CRLF;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8486 else
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8487 normal_eol = utf_16_be_eol = utf_16_le_eol = EOL_SEEN_CR;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8488 }
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8489
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8490 for (tail = val; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8491 {
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8492 enum coding_category category;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8493 int this_eol;
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8494
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8495 id = XINT (XCAR (tail));
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8496 attrs = CODING_ID_ATTRS (id);
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8497 category = XINT (CODING_ATTR_CATEGORY (attrs));
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8498 eol_type = CODING_ID_EOL_TYPE (id);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8499 if (VECTORP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8500 {
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8501 if (category == coding_category_utf_16_be
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8502 || category == coding_category_utf_16_be_nosig)
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8503 this_eol = utf_16_be_eol;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8504 else if (category == coding_category_utf_16_le
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8505 || category == coding_category_utf_16_le_nosig)
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8506 this_eol = utf_16_le_eol;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8507 else
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8508 this_eol = normal_eol;
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8509
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8510 if (this_eol == EOL_SEEN_LF)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8511 XSETCAR (tail, AREF (eol_type, 0));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8512 else if (this_eol == EOL_SEEN_CRLF)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8513 XSETCAR (tail, AREF (eol_type, 1));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8514 else if (this_eol == EOL_SEEN_CR)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8515 XSETCAR (tail, AREF (eol_type, 2));
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8516 else
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8517 XSETCAR (tail, CODING_ID_NAME (id));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8518 }
89193
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8519 else
311d061195ef (detect_coding_utf_8): Check incomplete byte sequence.
Kenichi Handa <handa@m17n.org>
parents: 89184
diff changeset
8520 XSETCAR (tail, CODING_ID_NAME (id));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8521 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8522 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8523
100135
0e17542db552 (detect_coding_system): Initialize utf_16_le_eol to -1, val to
Kenichi Handa <handa@m17n.org>
parents: 100133
diff changeset
8524 return (highest ? (CONSP (val) ? XCAR (val) : Qnil) : val);
42104
d69c2368e549 (DECODE_COMPOSITION_END): Fixed a typo in the last
Sam Steingold <sds@gnu.org>
parents: 42103
diff changeset
8525 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8526
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8527
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8528 DEFUN ("detect-coding-region", Fdetect_coding_region, Sdetect_coding_region,
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8529 2, 3, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8530 doc: /* Detect coding system of the text in the region between START and END.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8531 Return a list of possible coding systems ordered by priority.
102737
f556415c326b (Fdetect_coding_region, Fcoding_system_priority_list): Improve the
Kenichi Handa <handa@m17n.org>
parents: 102422
diff changeset
8532 The coding systems to try and their priorities follows what
f556415c326b (Fdetect_coding_region, Fcoding_system_priority_list): Improve the
Kenichi Handa <handa@m17n.org>
parents: 102422
diff changeset
8533 the function `coding-system-priority-list' (which see) returns.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8534
72552
6493d4697ad2 (Fdetect_coding_region, Fdetect_coding_string): Fix
Kenichi Handa <handa@m17n.org>
parents: 72395
diff changeset
8535 If only ASCII characters are found (except for such ISO-2022 control
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8536 characters as ESC), it returns a list of single element `undecided'
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8537 or its subsidiary coding system according to a detected end-of-line
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8538 format.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8539
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8540 If optional argument HIGHEST is non-nil, return the coding system of
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8541 highest priority. */)
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8542 (start, end, highest)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8543 Lisp_Object start, end, highest;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8544 {
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8545 int from, to;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8546 int from_byte, to_byte;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8547
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8548 CHECK_NUMBER_COERCE_MARKER (start);
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8549 CHECK_NUMBER_COERCE_MARKER (end);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8550
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8551 validate_region (&start, &end);
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8552 from = XINT (start), to = XINT (end);
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8553 from_byte = CHAR_TO_BYTE (from);
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8554 to_byte = CHAR_TO_BYTE (to);
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8555
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8556 if (from < GPT && to >= GPT)
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8557 move_gap_both (to, to_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8558
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8559 return detect_coding_system (BYTE_POS_ADDR (from_byte),
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8560 to - from, to_byte - from_byte,
34531
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
8561 !NILP (highest),
37f85e931855 (ONE_MORE_BYTE_CHECK_MULTIBYTE): New macro.
Kenichi Handa <handa@m17n.org>
parents: 34197
diff changeset
8562 !NILP (current_buffer
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8563 ->enable_multibyte_characters),
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8564 Qnil);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8565 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8566
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8567 DEFUN ("detect-coding-string", Fdetect_coding_string, Sdetect_coding_string,
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8568 1, 2, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8569 doc: /* Detect coding system of the text in STRING.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8570 Return a list of possible coding systems ordered by priority.
102738
41e7ab490f69 (Fdetect_coding_string): Improve the docstrings.
Kenichi Handa <handa@m17n.org>
parents: 102737
diff changeset
8571 The coding systems to try and their priorities follows what
41e7ab490f69 (Fdetect_coding_string): Improve the docstrings.
Kenichi Handa <handa@m17n.org>
parents: 102737
diff changeset
8572 the function `coding-system-priority-list' (which see) returns.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8573
72552
6493d4697ad2 (Fdetect_coding_region, Fdetect_coding_string): Fix
Kenichi Handa <handa@m17n.org>
parents: 72395
diff changeset
8574 If only ASCII characters are found (except for such ISO-2022 control
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8575 characters as ESC), it returns a list of single element `undecided'
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8576 or its subsidiary coding system according to a detected end-of-line
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8577 format.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8578
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8579 If optional argument HIGHEST is non-nil, return the coding system of
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8580 highest priority. */)
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8581 (string, highest)
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8582 Lisp_Object string, highest;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8583 {
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8584 CHECK_STRING (string);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8585
46370
40db0673e6f0 Most uses of XSTRING combined with STRING_BYTES or indirection changed to
Ken Raeburn <raeburn@raeburn.org>
parents: 46293
diff changeset
8586 return detect_coding_system (SDATA (string),
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
8587 SCHARS (string), SBYTES (string),
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8588 !NILP (highest), STRING_MULTIBYTE (string),
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8589 Qnil);
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8590 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8591
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8592
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8593 static INLINE int
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8594 char_encodable_p (c, attrs)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8595 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8596 Lisp_Object attrs;
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8597 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8598 Lisp_Object tail;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8599 struct charset *charset;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8600 Lisp_Object translation_table;
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8601
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8602 translation_table = CODING_ATTR_TRANS_TBL (attrs);
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
8603 if (! NILP (translation_table))
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8604 c = translate_char (translation_table, c);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8605 for (tail = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8606 CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8607 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8608 charset = CHARSET_FROM_ID (XINT (XCAR (tail)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8609 if (CHAR_CHARSET_P (c, charset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8610 break;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8611 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8612 return (! NILP (tail));
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8613 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8614
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8615
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8616 /* Return a list of coding systems that safely encode the text between
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8617 START and END. If EXCLUDE is non-nil, it is a list of coding
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8618 systems not to check. The returned list doesn't contain any such
88889
4548f224c603 (Ffind_coding_systems_region_internal): Detect an
Kenichi Handa <handa@m17n.org>
parents: 88876
diff changeset
8619 coding systems. In any case, if the text contains only ASCII or is
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8620 unibyte, return t. */
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8621
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8622 DEFUN ("find-coding-systems-region-internal",
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8623 Ffind_coding_systems_region_internal,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8624 Sfind_coding_systems_region_internal, 2, 3, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
8625 doc: /* Internal use only. */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8626 (start, end, exclude)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8627 Lisp_Object start, end, exclude;
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8628 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8629 Lisp_Object coding_attrs_list, safe_codings;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8630 EMACS_INT start_byte, end_byte;
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
8631 const unsigned char *p, *pbeg, *pend;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8632 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8633 Lisp_Object tail, elt;
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8634
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8635 if (STRINGP (start))
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8636 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8637 if (!STRING_MULTIBYTE (start)
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8638 || SCHARS (start) == SBYTES (start))
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8639 return Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8640 start_byte = 0;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8641 end_byte = SBYTES (start);
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8642 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8643 else
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8644 {
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8645 CHECK_NUMBER_COERCE_MARKER (start);
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8646 CHECK_NUMBER_COERCE_MARKER (end);
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8647 if (XINT (start) < BEG || XINT (end) > Z || XINT (start) > XINT (end))
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8648 args_out_of_range (start, end);
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8649 if (NILP (current_buffer->enable_multibyte_characters))
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8650 return Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8651 start_byte = CHAR_TO_BYTE (XINT (start));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8652 end_byte = CHAR_TO_BYTE (XINT (end));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8653 if (XINT (end) - XINT (start) == end_byte - start_byte)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8654 return Qt;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8655
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8656 if (XINT (start) < GPT && XINT (end) > GPT)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8657 {
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8658 if ((GPT - XINT (start)) < (XINT (end) - GPT))
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8659 move_gap_both (XINT (start), start_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8660 else
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8661 move_gap_both (XINT (end), end_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8662 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8663 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8664
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8665 coding_attrs_list = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8666 for (tail = Vcoding_system_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8667 if (NILP (exclude)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8668 || NILP (Fmemq (XCAR (tail), exclude)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8669 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8670 Lisp_Object attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8671
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8672 attrs = AREF (CODING_SYSTEM_SPEC (XCAR (tail)), 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8673 if (EQ (XCAR (tail), CODING_ATTR_BASE_NAME (attrs))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8674 && ! EQ (CODING_ATTR_TYPE (attrs), Qundecided))
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8675 {
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8676 ASET (attrs, coding_attr_trans_tbl,
89861
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
8677 get_translation_table (attrs, 1, NULL));
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8678 coding_attrs_list = Fcons (attrs, coding_attrs_list);
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8679 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8680 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8681
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8682 if (STRINGP (start))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8683 p = pbeg = SDATA (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8684 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8685 p = pbeg = BYTE_POS_ADDR (start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8686 pend = p + (end_byte - start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8687
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8688 while (p < pend && ASCII_BYTE_P (*p)) p++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8689 while (p < pend && ASCII_BYTE_P (*(pend - 1))) pend--;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8690
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8691 while (p < pend)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8692 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8693 if (ASCII_BYTE_P (*p))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8694 p++;
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8695 else
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8696 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8697 c = STRING_CHAR_ADVANCE (p);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8698
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8699 charset_map_loaded = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8700 for (tail = coding_attrs_list; CONSP (tail);)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8701 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8702 elt = XCAR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8703 if (NILP (elt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8704 tail = XCDR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8705 else if (char_encodable_p (c, elt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8706 tail = XCDR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8707 else if (CONSP (XCDR (tail)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8708 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8709 XSETCAR (tail, XCAR (XCDR (tail)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8710 XSETCDR (tail, XCDR (XCDR (tail)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8711 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8712 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8713 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8714 XSETCAR (tail, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8715 tail = XCDR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8716 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8717 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8718 if (charset_map_loaded)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8719 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8720 EMACS_INT p_offset = p - pbeg, pend_offset = pend - pbeg;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8721
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8722 if (STRINGP (start))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8723 pbeg = SDATA (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8724 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8725 pbeg = BYTE_POS_ADDR (start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8726 p = pbeg + p_offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8727 pend = pbeg + pend_offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8728 }
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8729 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8730 }
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8731
89905
37e044cc35f6 (Ffind_coding_systems_region_internal): Include raw-text and
Kenichi Handa <handa@m17n.org>
parents: 89892
diff changeset
8732 safe_codings = list2 (Qraw_text, Qno_conversion);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8733 for (tail = coding_attrs_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8734 if (! NILP (XCAR (tail)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8735 safe_codings = Fcons (CODING_ATTR_BASE_NAME (XCAR (tail)), safe_codings);
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
8736
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
8737 return safe_codings;
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
8738 }
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
8739
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
8740
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8741 DEFUN ("unencodable-char-position", Funencodable_char_position,
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8742 Sunencodable_char_position, 3, 5, 0,
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8743 doc: /*
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8744 Return position of first un-encodable character in a region.
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8745 START and END specify the region and CODING-SYSTEM specifies the
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8746 encoding to check. Return nil if CODING-SYSTEM does encode the region.
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8747
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8748 If optional 4th argument COUNT is non-nil, it specifies at most how
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8749 many un-encodable characters to search. In this case, the value is a
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8750 list of positions.
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8751
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8752 If optional 5th argument STRING is non-nil, it is a string to search
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8753 for un-encodable characters. In that case, START and END are indexes
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8754 to the string. */)
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8755 (start, end, coding_system, count, string)
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8756 Lisp_Object start, end, coding_system, count, string;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8757 {
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8758 int n;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8759 struct coding_system coding;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8760 Lisp_Object attrs, charset_list, translation_table;
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8761 Lisp_Object positions;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8762 int from, to;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8763 const unsigned char *p, *stop, *pend;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8764 int ascii_compatible;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8765
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8766 setup_coding_system (Fcheck_coding_system (coding_system), &coding);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8767 attrs = CODING_ID_ATTRS (coding.id);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8768 if (EQ (CODING_ATTR_TYPE (attrs), Qraw_text))
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8769 return Qnil;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8770 ascii_compatible = ! NILP (CODING_ATTR_ASCII_COMPAT (attrs));
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8771 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
89861
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
8772 translation_table = get_translation_table (attrs, 1, NULL);
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8773
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8774 if (NILP (string))
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8775 {
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8776 validate_region (&start, &end);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8777 from = XINT (start);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8778 to = XINT (end);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8779 if (NILP (current_buffer->enable_multibyte_characters)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8780 || (ascii_compatible
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8781 && (to - from) == (CHAR_TO_BYTE (to) - (CHAR_TO_BYTE (from)))))
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8782 return Qnil;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8783 p = CHAR_POS_ADDR (from);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8784 pend = CHAR_POS_ADDR (to);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8785 if (from < GPT && to >= GPT)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8786 stop = GPT_ADDR;
48829
f6c59ca557c7 (Funencodable_char_position): Set pend correctly.
Kenichi Handa <handa@m17n.org>
parents: 48230
diff changeset
8787 else
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8788 stop = pend;
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8789 }
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8790 else
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8791 {
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8792 CHECK_STRING (string);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8793 CHECK_NATNUM (start);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8794 CHECK_NATNUM (end);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8795 from = XINT (start);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8796 to = XINT (end);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8797 if (from > to
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8798 || to > SCHARS (string))
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8799 args_out_of_range_3 (string, start, end);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8800 if (! STRING_MULTIBYTE (string))
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8801 return Qnil;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8802 p = SDATA (string) + string_char_to_byte (string, from);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8803 stop = pend = SDATA (string) + string_char_to_byte (string, to);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8804 if (ascii_compatible && (to - from) == (pend - p))
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8805 return Qnil;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8806 }
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8807
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8808 if (NILP (count))
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8809 n = 1;
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8810 else
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8811 {
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8812 CHECK_NATNUM (count);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8813 n = XINT (count);
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8814 }
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8815
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8816 positions = Qnil;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8817 while (1)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8818 {
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8819 int c;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8820
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8821 if (ascii_compatible)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8822 while (p < stop && ASCII_BYTE_P (*p))
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8823 p++, from++;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8824 if (p >= stop)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8825 {
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8826 if (p >= pend)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8827 break;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8828 stop = pend;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8829 p = GAP_END_ADDR;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8830 }
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8831
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8832 c = STRING_CHAR_ADVANCE (p);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8833 if (! (ASCII_CHAR_P (c) && ascii_compatible)
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8834 && ! char_charset (translate_char (translation_table, c),
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8835 charset_list, NULL))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8836 {
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8837 positions = Fcons (make_number (from), positions);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8838 n--;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8839 if (n == 0)
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8840 break;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8841 }
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8842
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8843 from++;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8844 }
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8845
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8846 return (NILP (count) ? Fcar (positions) : Fnreverse (positions));
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8847 }
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8848
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8849
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8850 DEFUN ("check-coding-systems-region", Fcheck_coding_systems_region,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8851 Scheck_coding_systems_region, 3, 3, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8852 doc: /* Check if the region is encodable by coding systems.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8853
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8854 START and END are buffer positions specifying the region.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8855 CODING-SYSTEM-LIST is a list of coding systems to check.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8856
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8857 The value is an alist ((CODING-SYSTEM POS0 POS1 ...) ...), where
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
8858 CODING-SYSTEM is a member of CODING-SYSTEM-LIST and can't encode the
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8859 whole region, POS0, POS1, ... are buffer positions where non-encodable
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8860 characters are found.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8861
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8862 If all coding systems in CODING-SYSTEM-LIST can encode the region, the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8863 value is nil.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8864
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8865 START may be a string. In that case, check if the string is
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8866 encodable, and the value contains indices to the string instead of
102055
4d3a5c88cb2b (Fcheck_coding_systems_region): Fix typo; Qt -> Qnil.
Kenichi Handa <handa@m17n.org>
parents: 101943
diff changeset
8867 buffer positions. END is ignored.
4d3a5c88cb2b (Fcheck_coding_systems_region): Fix typo; Qt -> Qnil.
Kenichi Handa <handa@m17n.org>
parents: 101943
diff changeset
8868
102058
4f60db600648 (Fcheck_coding_systems_region): Fix test for unibyte
Andreas Schwab <schwab@suse.de>
parents: 102055
diff changeset
8869 If the current buffer (or START if it is a string) is unibyte, the value
102055
4d3a5c88cb2b (Fcheck_coding_systems_region): Fix typo; Qt -> Qnil.
Kenichi Handa <handa@m17n.org>
parents: 101943
diff changeset
8870 is nil. */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8871 (start, end, coding_system_list)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8872 Lisp_Object start, end, coding_system_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8873 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8874 Lisp_Object list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8875 EMACS_INT start_byte, end_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8876 int pos;
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
8877 const unsigned char *p, *pbeg, *pend;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8878 int c;
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8879 Lisp_Object tail, elt, attrs;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8880
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8881 if (STRINGP (start))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8882 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8883 if (!STRING_MULTIBYTE (start)
102058
4f60db600648 (Fcheck_coding_systems_region): Fix test for unibyte
Andreas Schwab <schwab@suse.de>
parents: 102055
diff changeset
8884 || SCHARS (start) == SBYTES (start))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8885 return Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8886 start_byte = 0;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8887 end_byte = SBYTES (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8888 pos = 0;
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
8889 }
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8890 else
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8891 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8892 CHECK_NUMBER_COERCE_MARKER (start);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8893 CHECK_NUMBER_COERCE_MARKER (end);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8894 if (XINT (start) < BEG || XINT (end) > Z || XINT (start) > XINT (end))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8895 args_out_of_range (start, end);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8896 if (NILP (current_buffer->enable_multibyte_characters))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8897 return Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8898 start_byte = CHAR_TO_BYTE (XINT (start));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8899 end_byte = CHAR_TO_BYTE (XINT (end));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8900 if (XINT (end) - XINT (start) == end_byte - start_byte)
102055
4d3a5c88cb2b (Fcheck_coding_systems_region): Fix typo; Qt -> Qnil.
Kenichi Handa <handa@m17n.org>
parents: 101943
diff changeset
8901 return Qnil;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8902
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8903 if (XINT (start) < GPT && XINT (end) > GPT)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8904 {
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8905 if ((GPT - XINT (start)) < (XINT (end) - GPT))
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8906 move_gap_both (XINT (start), start_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8907 else
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8908 move_gap_both (XINT (end), end_byte);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8909 }
89394
6ffca50f25b9 (Fcheck_coding_systems_region): Fix type errors.
Dave Love <fx@gnu.org>
parents: 89373
diff changeset
8910 pos = XINT (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8911 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8912
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8913 list = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8914 for (tail = coding_system_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8915 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8916 elt = XCAR (tail);
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8917 attrs = AREF (CODING_SYSTEM_SPEC (elt), 0);
89861
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
8918 ASET (attrs, coding_attr_trans_tbl,
7160ded23e55 (get_translation_table): Allow max_lookup to be NULL.
Kenichi Handa <handa@m17n.org>
parents: 89859
diff changeset
8919 get_translation_table (attrs, 1, NULL));
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
8920 list = Fcons (Fcons (elt, Fcons (attrs, Qnil)), list);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8921 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8922
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8923 if (STRINGP (start))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8924 p = pbeg = SDATA (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8925 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8926 p = pbeg = BYTE_POS_ADDR (start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8927 pend = p + (end_byte - start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8928
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8929 while (p < pend && ASCII_BYTE_P (*p)) p++, pos++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8930 while (p < pend && ASCII_BYTE_P (*(pend - 1))) pend--;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8931
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8932 while (p < pend)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8933 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8934 if (ASCII_BYTE_P (*p))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8935 p++;
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8936 else
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8937 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8938 c = STRING_CHAR_ADVANCE (p);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8939
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8940 charset_map_loaded = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8941 for (tail = list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8942 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8943 elt = XCDR (XCAR (tail));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8944 if (! char_encodable_p (c, XCAR (elt)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8945 XSETCDR (elt, Fcons (make_number (pos), XCDR (elt)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8946 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8947 if (charset_map_loaded)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8948 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8949 EMACS_INT p_offset = p - pbeg, pend_offset = pend - pbeg;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8950
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8951 if (STRINGP (start))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
8952 pbeg = SDATA (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8953 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8954 pbeg = BYTE_POS_ADDR (start_byte);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8955 p = pbeg + p_offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8956 pend = pbeg + pend_offset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8957 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8958 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8959 pos++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8960 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8961
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8962 tail = list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8963 list = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8964 for (; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8965 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8966 elt = XCAR (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8967 if (CONSP (XCDR (XCDR (elt))))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8968 list = Fcons (Fcons (XCAR (elt), Fnreverse (XCDR (XCDR (elt)))),
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8969 list);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8970 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8971
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8972 return list;
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8973 }
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8974
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
8975
20803
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
8976 Lisp_Object
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8977 code_convert_region (start, end, coding_system, dst_object, encodep, norecord)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8978 Lisp_Object start, end, coding_system, dst_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8979 int encodep, norecord;
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8980 {
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8981 struct coding_system coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8982 EMACS_INT from, from_byte, to, to_byte;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8983 Lisp_Object src_object;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8984
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8985 CHECK_NUMBER_COERCE_MARKER (start);
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
8986 CHECK_NUMBER_COERCE_MARKER (end);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8987 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8988 coding_system = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8989 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8990 CHECK_CODING_SYSTEM (coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8991 src_object = Fcurrent_buffer ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8992 if (NILP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8993 dst_object = src_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8994 else if (! EQ (dst_object, Qt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8995 CHECK_BUFFER (dst_object);
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
8996
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8997 validate_region (&start, &end);
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
8998 from = XFASTINT (start);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
8999 from_byte = CHAR_TO_BYTE (from);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9000 to = XFASTINT (end);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9001 to_byte = CHAR_TO_BYTE (to);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9002
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9003 setup_coding_system (coding_system, &coding);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9004 coding.mode |= CODING_MODE_LAST_BLOCK;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9005
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9006 if (encodep)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9007 encode_coding_object (&coding, src_object, from, from_byte, to, to_byte,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9008 dst_object);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9009 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9010 decode_coding_object (&coding, src_object, from, from_byte, to, to_byte,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9011 dst_object);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9012 if (! norecord)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9013 Vlast_coding_system_used = CODING_ID_NAME (coding.id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9014
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9015 return (BUFFERP (dst_object)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9016 ? make_number (coding.produced_char)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9017 : coding.dst_object);
20803
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9018 }
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9019
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9020
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9021 DEFUN ("decode-coding-region", Fdecode_coding_region, Sdecode_coding_region,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9022 3, 4, "r\nzCoding system: ",
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9023 doc: /* Decode the current region from the specified coding system.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9024 When called from a program, takes four arguments:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9025 START, END, CODING-SYSTEM, and DESTINATION.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9026 START and END are buffer positions.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9027
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9028 Optional 4th arguments DESTINATION specifies where the decoded text goes.
91083
ff87badce376 (Fdecode_coding_region): Fix typo in docstring.
Kenichi Handa <handa@m17n.org>
parents: 91056
diff changeset
9029 If nil, the region between START and END is replaced by the decoded text.
98992
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
9030 If buffer, the decoded text is inserted in that buffer after point (point
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
9031 does not move).
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
9032 In those cases, the length of the decoded text is returned.
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
9033 If DESTINATION is t, the decoded text is returned.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9034
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9035 This function sets `last-coding-system-used' to the precise coding system
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9036 used (which may be different from CODING-SYSTEM if CODING-SYSTEM is
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
9037 not fully specified.) */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9038 (start, end, coding_system, destination)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9039 Lisp_Object start, end, coding_system, destination;
20803
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9040 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9041 return code_convert_region (start, end, coding_system, destination, 0, 0);
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
9042 }
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
9043
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
9044 DEFUN ("encode-coding-region", Fencode_coding_region, Sencode_coding_region,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9045 3, 4, "r\nzCoding system: ",
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9046 doc: /* Encode the current region by specified coding system.
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9047 When called from a program, takes four arguments:
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9048 START, END, CODING-SYSTEM and DESTINATION.
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9049 START and END are buffer positions.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9050
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9051 Optional 4th arguments DESTINATION specifies where the encoded text goes.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9052 If nil, the region between START and END is replace by the encoded text.
98992
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
9053 If buffer, the encoded text is inserted in that buffer after point (point
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
9054 does not move).
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
9055 In those cases, the length of the encoded text is returned.
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
9056 If DESTINATION is t, the encoded text is returned.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9057
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9058 This function sets `last-coding-system-used' to the precise coding system
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9059 used (which may be different from CODING-SYSTEM if CODING-SYSTEM is
95353
96d35f50fe34 (encode_coding_raw_text): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 95345
diff changeset
9060 not fully specified.) */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9061 (start, end, coding_system, destination)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9062 Lisp_Object start, end, coding_system, destination;
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
9063 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9064 return code_convert_region (start, end, coding_system, destination, 1, 0);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9065 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9066
20803
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9067 Lisp_Object
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9068 code_convert_string (string, coding_system, dst_object,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9069 encodep, nocopy, norecord)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9070 Lisp_Object string, coding_system, dst_object;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9071 int encodep, nocopy, norecord;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9072 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9073 struct coding_system coding;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9074 EMACS_INT chars, bytes;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9075
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
9076 CHECK_STRING (string);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9077 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9078 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9079 if (! norecord)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9080 Vlast_coding_system_used = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9081 if (NILP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9082 return (nocopy ? Fcopy_sequence (string) : string);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9083 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9084
70520
b6740a317343 (setup_coding_system): For invalid coding-system, set
Kenichi Handa <handa@m17n.org>
parents: 69995
diff changeset
9085 if (NILP (coding_system))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9086 coding_system = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9087 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9088 CHECK_CODING_SYSTEM (coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9089 if (NILP (dst_object))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9090 dst_object = Qt;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9091 else if (! EQ (dst_object, Qt))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9092 CHECK_BUFFER (dst_object);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9093
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9094 setup_coding_system (coding_system, &coding);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9095 coding.mode |= CODING_MODE_LAST_BLOCK;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9096 chars = SCHARS (string);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9097 bytes = SBYTES (string);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9098 if (encodep)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9099 encode_coding_object (&coding, string, 0, 0, chars, bytes, dst_object);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9100 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9101 decode_coding_object (&coding, string, 0, 0, chars, bytes, dst_object);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9102 if (! norecord)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9103 Vlast_coding_system_used = CODING_ID_NAME (coding.id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9104
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9105 return (BUFFERP (dst_object)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9106 ? make_number (coding.produced_char)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9107 : coding.dst_object);
20803
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9108 }
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9109
0fa2183c587d (ENCODE_ISO_CHARACTER): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 20794
diff changeset
9110
22341
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
9111 /* Encode or decode STRING according to CODING_SYSTEM.
26847
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
9112 Do not set Vlast_coding_system_used.
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
9113
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
9114 This function is called only from macros DECODE_FILE and
2f17ea330dae Include composite.h.
Kenichi Handa <handa@m17n.org>
parents: 26742
diff changeset
9115 ENCODE_FILE, thus we ignore character composition. */
22341
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
9116
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
9117 Lisp_Object
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
9118 code_convert_string_norecord (string, coding_system, encodep)
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
9119 Lisp_Object string, coding_system;
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
9120 int encodep;
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
9121 {
88430
6418a272b97e * coding.c: Delete unused variables.
Kenichi Handa <handa@m17n.org>
parents: 88365
diff changeset
9122 return code_convert_string (string, coding_system, Qt, encodep, 0, 1);
22341
572ba933a4bf (code_convert_string_norecord): New function.
Karl Heuer <kwzh@gnu.org>
parents: 22329
diff changeset
9123 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9124
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9125
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9126 DEFUN ("decode-coding-string", Fdecode_coding_string, Sdecode_coding_string,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9127 2, 4, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9128 doc: /* Decode STRING which is encoded in CODING-SYSTEM, and return the result.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9129
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9130 Optional third arg NOCOPY non-nil means it is OK to return STRING itself
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9131 if the decoding operation is trivial.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9132
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9133 Optional fourth arg BUFFER non-nil means that the decoded text is
98992
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
9134 inserted in that buffer after point (point does not move). In this
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
9135 case, the return value is the length of the decoded text.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9136
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9137 This function sets `last-coding-system-used' to the precise coding system
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9138 used (which may be different from CODING-SYSTEM if CODING-SYSTEM is
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9139 not fully specified.) */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9140 (string, coding_system, nocopy, buffer)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9141 Lisp_Object string, coding_system, nocopy, buffer;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9142 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9143 return code_convert_string (string, coding_system, buffer,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9144 0, ! NILP (nocopy), 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9145 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9146
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9147 DEFUN ("encode-coding-string", Fencode_coding_string, Sencode_coding_string,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9148 2, 4, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9149 doc: /* Encode STRING to CODING-SYSTEM, and return the result.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9150
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9151 Optional third arg NOCOPY non-nil means it is OK to return STRING
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9152 itself if the encoding operation is trivial.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9153
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9154 Optional fourth arg BUFFER non-nil means that the encoded text is
98992
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
9155 inserted in that buffer after point (point does not move). In this
d4659edb9b7b (Fencode_coding_region, Fdecode_coding_region)
Eli Zaretskii <eliz@gnu.org>
parents: 98951
diff changeset
9156 case, the return value is the length of the encoded text.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9157
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9158 This function sets `last-coding-system-used' to the precise coding system
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9159 used (which may be different from CODING-SYSTEM if CODING-SYSTEM is
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9160 not fully specified.) */)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9161 (string, coding_system, nocopy, buffer)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9162 Lisp_Object string, coding_system, nocopy, buffer;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9163 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9164 return code_convert_string (string, coding_system, buffer,
88856
13a375bc220d (ENCODE_DESIGNATION, decode_eol)
Dave Love <fx@gnu.org>
parents: 88845
diff changeset
9165 1, ! NILP (nocopy), 1);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9166 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9167
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
9168
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9169 DEFUN ("decode-sjis-char", Fdecode_sjis_char, Sdecode_sjis_char, 1, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9170 doc: /* Decode a Japanese character which has CODE in shift_jis encoding.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9171 Return the corresponding character. */)
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9172 (code)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9173 Lisp_Object code;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9174 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9175 Lisp_Object spec, attrs, val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9176 struct charset *charset_roman, *charset_kanji, *charset_kana, *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9177 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9178
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9179 CHECK_NATNUM (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9180 c = XFASTINT (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9181 CHECK_CODING_SYSTEM_GET_SPEC (Vsjis_coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9182 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9183
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9184 if (ASCII_BYTE_P (c)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9185 && ! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9186 return code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9187
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9188 val = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9189 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
88497
d2b9e0d4c2f6 (Fdecode_sjis_char): Fix typo (0x7F->0xFF). Fix the
Kenichi Handa <handa@m17n.org>
parents: 88485
diff changeset
9190 charset_kana = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
d2b9e0d4c2f6 (Fdecode_sjis_char): Fix typo (0x7F->0xFF). Fix the
Kenichi Handa <handa@m17n.org>
parents: 88485
diff changeset
9191 charset_kanji = CHARSET_FROM_ID (XINT (XCAR (val)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9192
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9193 if (c <= 0x7F)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9194 charset = charset_roman;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9195 else if (c >= 0xA0 && c < 0xDF)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9196 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9197 charset = charset_kana;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9198 c -= 0x80;
24065
7e291dea6141 (Fdecode_sjis_char): Decode Japanese Katakana character
Kenichi Handa <handa@m17n.org>
parents: 24056
diff changeset
9199 }
7e291dea6141 (Fdecode_sjis_char): Decode Japanese Katakana character
Kenichi Handa <handa@m17n.org>
parents: 24056
diff changeset
9200 else
7e291dea6141 (Fdecode_sjis_char): Decode Japanese Katakana character
Kenichi Handa <handa@m17n.org>
parents: 24056
diff changeset
9201 {
88497
d2b9e0d4c2f6 (Fdecode_sjis_char): Fix typo (0x7F->0xFF). Fix the
Kenichi Handa <handa@m17n.org>
parents: 88485
diff changeset
9202 int s1 = c >> 8, s2 = c & 0xFF;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9203
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9204 if (s1 < 0x81 || (s1 > 0x9F && s1 < 0xE0) || s1 > 0xEF
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9205 || s2 < 0x40 || s2 == 0x7F || s2 > 0xFC)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9206 error ("Invalid code: %d", code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9207 SJIS_TO_JIS (c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9208 charset = charset_kanji;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9209 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9210 c = DECODE_CHAR (charset, c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9211 if (c < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9212 error ("Invalid code: %d", code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9213 return make_number (c);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9214 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9215
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9216
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9217 DEFUN ("encode-sjis-char", Fencode_sjis_char, Sencode_sjis_char, 1, 1, 0,
73949
0d1207b43a5b (Fencode_sjis_char, Fencode_big5_char): Improve argument/docstring consistency.
Juanma Barranquero <lekktu@gmail.com>
parents: 72552
diff changeset
9218 doc: /* Encode a Japanese character CH to shift_jis encoding.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9219 Return the corresponding code in SJIS. */)
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9220 (ch)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9221 Lisp_Object ch;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9222 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9223 Lisp_Object spec, attrs, charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9224 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9225 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9226 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9227
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9228 CHECK_CHARACTER (ch);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9229 c = XFASTINT (ch);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9230 CHECK_CODING_SYSTEM_GET_SPEC (Vsjis_coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9231 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9232
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9233 if (ASCII_CHAR_P (c)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9234 && ! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9235 return ch;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9236
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9237 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9238 charset = char_charset (c, charset_list, &code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9239 if (code == CHARSET_INVALID_CODE (charset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9240 error ("Can't encode by shift_jis encoding: %d", c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9241 JIS_TO_SJIS (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9242
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9243 return make_number (code);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9244 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9245
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9246 DEFUN ("decode-big5-char", Fdecode_big5_char, Sdecode_big5_char, 1, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9247 doc: /* Decode a Big5 character which has CODE in BIG5 coding system.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9248 Return the corresponding character. */)
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9249 (code)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9250 Lisp_Object code;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9251 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9252 Lisp_Object spec, attrs, val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9253 struct charset *charset_roman, *charset_big5, *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9254 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9255
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9256 CHECK_NATNUM (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9257 c = XFASTINT (code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9258 CHECK_CODING_SYSTEM_GET_SPEC (Vbig5_coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9259 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9260
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9261 if (ASCII_BYTE_P (c)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9262 && ! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9263 return code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9264
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9265 val = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9266 charset_roman = CHARSET_FROM_ID (XINT (XCAR (val))), val = XCDR (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9267 charset_big5 = CHARSET_FROM_ID (XINT (XCAR (val)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9268
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9269 if (c <= 0x7F)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9270 charset = charset_roman;
24324
2eec590faf26 (Fdecode_sjis_char, Fencode_sjis_char): Hanlde
Kenichi Handa <handa@m17n.org>
parents: 24316
diff changeset
9271 else
2eec590faf26 (Fdecode_sjis_char, Fencode_sjis_char): Hanlde
Kenichi Handa <handa@m17n.org>
parents: 24316
diff changeset
9272 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9273 int b1 = c >> 8, b2 = c & 0x7F;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9274 if (b1 < 0xA1 || b1 > 0xFE
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9275 || b2 < 0x40 || (b2 > 0x7E && b2 < 0xA1) || b2 > 0xFE)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9276 error ("Invalid code: %d", code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9277 charset = charset_big5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9278 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9279 c = DECODE_CHAR (charset, (unsigned )c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9280 if (c < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9281 error ("Invalid code: %d", code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9282 return make_number (c);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9283 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9284
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9285 DEFUN ("encode-big5-char", Fencode_big5_char, Sencode_big5_char, 1, 1, 0,
73949
0d1207b43a5b (Fencode_sjis_char, Fencode_big5_char): Improve argument/docstring consistency.
Juanma Barranquero <lekktu@gmail.com>
parents: 72552
diff changeset
9286 doc: /* Encode the Big5 character CH to BIG5 coding system.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9287 Return the corresponding character code in Big5. */)
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9288 (ch)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9289 Lisp_Object ch;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9290 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9291 Lisp_Object spec, attrs, charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9292 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9293 int c;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9294 unsigned code;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9295
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9296 CHECK_CHARACTER (ch);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9297 c = XFASTINT (ch);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9298 CHECK_CODING_SYSTEM_GET_SPEC (Vbig5_coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9299 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9300 if (ASCII_CHAR_P (c)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9301 && ! NILP (CODING_ATTR_ASCII_COMPAT (attrs)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9302 return ch;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9303
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9304 charset_list = CODING_ATTR_CHARSET_LIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9305 charset = char_charset (c, charset_list, &code);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9306 if (code == CHARSET_INVALID_CODE (charset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9307 error ("Can't encode by Big5 encoding: %d", c);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9308
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9309 return make_number (code);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9310 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9311
20680
dd46027e8412 (code_convert_region): Always count chars inserted
Richard M. Stallman <rms@gnu.org>
parents: 20668
diff changeset
9312
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
9313 DEFUN ("set-terminal-coding-system-internal", Fset_terminal_coding_system_internal,
83298
ed09a89e2b25 Fix UTF-8 tty input when first frame is an X frame. Steps towards multiple tty locale support.
Karoly Lorentey <lorentey@elte.hu>
parents: 83292
diff changeset
9314 Sset_terminal_coding_system_internal, 1, 2, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9315 doc: /* Internal use only. */)
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
9316 (coding_system, terminal)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9317 Lisp_Object coding_system;
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
9318 Lisp_Object terminal;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9319 {
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
9320 struct coding_system *terminal_coding = TERMINAL_TERMINAL_CODING (get_terminal (terminal, 1));
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
9321 CHECK_SYMBOL (coding_system);
83127
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
9322 setup_coding_system (Fcheck_coding_system (coding_system), terminal_coding);
20150
402b6e5f4b58 (encode_designation_at_bol): Fix bug of finding graphic
Kenichi Handa <handa@m17n.org>
parents: 20105
diff changeset
9323 /* We had better not send unsafe characters to terminal. */
91041
bdb3fe0ba9fa Merge from emacs--devo--0
Miles Bader <miles@gnu.org>
parents: 90996 84646
diff changeset
9324 terminal_coding->mode |= CODING_MODE_SAFE_ENCODING;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9325 /* Characer composition should be disabled. */
91041
bdb3fe0ba9fa Merge from emacs--devo--0
Miles Bader <miles@gnu.org>
parents: 90996 84646
diff changeset
9326 terminal_coding->common_flags &= ~CODING_ANNOTATE_COMPOSITION_MASK;
83127
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
9327 terminal_coding->src_multibyte = 1;
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
9328 terminal_coding->dst_multibyte = 0;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9329 return Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9330 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9331
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9332 DEFUN ("set-safe-terminal-coding-system-internal",
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9333 Fset_safe_terminal_coding_system_internal,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9334 Sset_safe_terminal_coding_system_internal, 1, 1, 0,
41006
fd83ec62a495 Doc fix.
Pavel Janík <Pavel@Janik.cz>
parents: 40842
diff changeset
9335 doc: /* Internal use only. */)
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9336 (coding_system)
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9337 Lisp_Object coding_system;
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9338 {
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
9339 CHECK_SYMBOL (coding_system);
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9340 setup_coding_system (Fcheck_coding_system (coding_system),
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9341 &safe_terminal_coding);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9342 /* Characer composition should be disabled. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9343 safe_terminal_coding.common_flags &= ~CODING_ANNOTATE_COMPOSITION_MASK;
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
9344 safe_terminal_coding.src_multibyte = 1;
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
9345 safe_terminal_coding.dst_multibyte = 0;
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9346 return Qnil;
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9347 }
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
9348
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
9349 DEFUN ("terminal-coding-system", Fterminal_coding_system,
83298
ed09a89e2b25 Fix UTF-8 tty input when first frame is an X frame. Steps towards multiple tty locale support.
Karoly Lorentey <lorentey@elte.hu>
parents: 83292
diff changeset
9350 Sterminal_coding_system, 0, 1, 0,
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
9351 doc: /* Return coding system specified for terminal output on the given terminal.
103052
e68707cf48a5 * keyboard.c (Fset_input_meta_mode): Doc fix.
Chong Yidong <cyd@stupidchicken.com>
parents: 103035
diff changeset
9352 TERMINAL may be a terminal object, a frame, or nil for the selected
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
9353 frame's terminal device. */)
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
9354 (terminal)
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
9355 Lisp_Object terminal;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9356 {
91046
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9357 struct coding_system *terminal_coding
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9358 = TERMINAL_TERMINAL_CODING (get_terminal (terminal, 1));
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9359 Lisp_Object coding_system = CODING_ID_NAME (terminal_coding->id);
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9360
90011
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
9361 /* For backward compatibility, return nil if it is `undecided'. */
90359
041f75914d0c (produce_composition): Compare charbuf[i] instead of
Kenichi Handa <handa@m17n.org>
parents: 90354
diff changeset
9362 return (! EQ (coding_system, Qundecided) ? coding_system : Qnil);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9363 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9364
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
9365 DEFUN ("set-keyboard-coding-system-internal", Fset_keyboard_coding_system_internal,
83298
ed09a89e2b25 Fix UTF-8 tty input when first frame is an X frame. Steps towards multiple tty locale support.
Karoly Lorentey <lorentey@elte.hu>
parents: 83292
diff changeset
9366 Sset_keyboard_coding_system_internal, 1, 2, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9367 doc: /* Internal use only. */)
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
9368 (coding_system, terminal)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9369 Lisp_Object coding_system;
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
9370 Lisp_Object terminal;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9371 {
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
9372 struct terminal *t = get_terminal (terminal, 1);
40656
cdfd4d09b79a Update usage of CHECK_ macros (remove unused second argument).
Pavel Janík <Pavel@Janik.cz>
parents: 40461
diff changeset
9373 CHECK_SYMBOL (coding_system);
83127
5182815e0ee1 Make terminal_coding and keyboard_coding display-local.
Karoly Lorentey <lorentey@elte.hu>
parents: 54320
diff changeset
9374 setup_coding_system (Fcheck_coding_system (coding_system),
91041
bdb3fe0ba9fa Merge from emacs--devo--0
Miles Bader <miles@gnu.org>
parents: 90996 84646
diff changeset
9375 TERMINAL_KEYBOARD_CODING (t));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9376 /* Characer composition should be disabled. */
91041
bdb3fe0ba9fa Merge from emacs--devo--0
Miles Bader <miles@gnu.org>
parents: 90996 84646
diff changeset
9377 TERMINAL_KEYBOARD_CODING (t)->common_flags
bdb3fe0ba9fa Merge from emacs--devo--0
Miles Bader <miles@gnu.org>
parents: 90996 84646
diff changeset
9378 &= ~CODING_ANNOTATE_COMPOSITION_MASK;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9379 return Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9380 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9381
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9382 DEFUN ("keyboard-coding-system",
91046
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9383 Fkeyboard_coding_system, Skeyboard_coding_system, 0, 1, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9384 doc: /* Return coding system specified for decoding keyboard input. */)
83431
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
9385 (terminal)
76396de7f50a Rename `struct device' to `struct terminal'. Rename some terminal-related functions similarly.
Karoly Lorentey <lorentey@elte.hu>
parents: 83423
diff changeset
9386 Lisp_Object terminal;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9387 {
91046
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9388 return CODING_ID_NAME (TERMINAL_KEYBOARD_CODING
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9389 (get_terminal (terminal, 1))->id);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9390 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9391
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9392
18536
69c0e220b626 (Vstandard_character_unification_table_for_decode):
Kenichi Handa <handa@m17n.org>
parents: 18523
diff changeset
9393 DEFUN ("find-operation-coding-system", Ffind_operation_coding_system,
69c0e220b626 (Vstandard_character_unification_table_for_decode):
Kenichi Handa <handa@m17n.org>
parents: 18523
diff changeset
9394 Sfind_operation_coding_system, 1, MANY, 0,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9395 doc: /* Choose a coding system for an operation based on the target name.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9396 The value names a pair of coding systems: (DECODING-SYSTEM . ENCODING-SYSTEM).
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9397 DECODING-SYSTEM is the coding system to use for decoding
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9398 \(in case OPERATION does decoding), and ENCODING-SYSTEM is the coding system
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9399 for encoding (in case OPERATION does encoding).
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9400
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9401 The first argument OPERATION specifies an I/O primitive:
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9402 For file I/O, `insert-file-contents' or `write-region'.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9403 For process I/O, `call-process', `call-process-region', or `start-process'.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9404 For network I/O, `open-network-stream'.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9405
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9406 The remaining arguments should be the same arguments that were passed
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9407 to the primitive. Depending on which primitive, one of those arguments
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9408 is selected as the TARGET. For example, if OPERATION does file I/O,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9409 whichever argument specifies the file name is TARGET.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9410
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9411 TARGET has a meaning which depends on OPERATION:
70948
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
9412 For file I/O, TARGET is a file name (except for the special case below).
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9413 For process I/O, TARGET is a process name.
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9414 For network I/O, TARGET is a service name or a port number.
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9415
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9416 This function looks up what is specified for TARGET in
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9417 `file-coding-system-alist', `process-coding-system-alist',
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9418 or `network-coding-system-alist' depending on OPERATION.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9419 They may specify a coding system, a cons of coding systems,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9420 or a function symbol to call.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9421 In the last case, we call the function with one argument,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9422 which is a list of all the arguments given to this function.
81611
ae42ad5f89e6 (Ffind_operation_coding_system): Docstring improved.
Kenichi Handa <handa@m17n.org>
parents: 75348
diff changeset
9423 If the function can't decide a coding system, it can return
ae42ad5f89e6 (Ffind_operation_coding_system): Docstring improved.
Kenichi Handa <handa@m17n.org>
parents: 75348
diff changeset
9424 `undecided' so that the normal code-detection is performed.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9425
70948
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
9426 If OPERATION is `insert-file-contents', the argument corresponding to
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
9427 TARGET may be a cons (FILENAME . BUFFER). In that case, FILENAME is a
71084
ccef92f2f7f8 (Ffind_operation_coding_system): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents: 71070
diff changeset
9428 file name to look up, and BUFFER is a buffer that contains the file's
ccef92f2f7f8 (Ffind_operation_coding_system): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents: 71070
diff changeset
9429 contents (not yet decoded). If `file-coding-system-alist' specifies a
71070
0c8ac7192244 (Ffind_operation_coding_system): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents: 71039
diff changeset
9430 function to call for FILENAME, that function should examine the
0c8ac7192244 (Ffind_operation_coding_system): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents: 71039
diff changeset
9431 contents of BUFFER instead of reading the file.
70948
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
9432
78152
5e5f359984e5 (Ffind_operation_coding_system): Doc fix.
Juanma Barranquero <lekktu@gmail.com>
parents: 75348
diff changeset
9433 usage: (find-operation-coding-system OPERATION ARGUMENTS...) */)
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
9434 (nargs, args)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9435 int nargs;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9436 Lisp_Object *args;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9437 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9438 Lisp_Object operation, target_idx, target, val;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9439 register Lisp_Object chain;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9440
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9441 if (nargs < 2)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9442 error ("Too few arguments");
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9443 operation = args[0];
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9444 if (!SYMBOLP (operation)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9445 || !INTEGERP (target_idx = Fget (operation, Qtarget_idx)))
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
9446 error ("Invalid first argument");
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9447 if (nargs < 1 + XINT (target_idx))
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9448 error ("Too few arguments for operation: %s",
46370
40db0673e6f0 Most uses of XSTRING combined with STRING_BYTES or indirection changed to
Ken Raeburn <raeburn@raeburn.org>
parents: 46293
diff changeset
9449 SDATA (SYMBOL_NAME (operation)));
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9450 target = args[XINT (target_idx) + 1];
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9451 if (!(STRINGP (target)
70948
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
9452 || (EQ (operation, Qinsert_file_contents) && CONSP (target)
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
9453 && STRINGP (XCAR (target)) && BUFFERP (XCDR (target)))
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9454 || (EQ (operation, Qopen_network_stream) && INTEGERP (target))))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9455 error ("Invalid %dth argument", XINT (target_idx) + 1);
70948
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
9456 if (CONSP (target))
7ea8b1c11d80 (Ffind_operation_coding_system): Allow (FILENAME . BUFFER) in TARGET.
Kenichi Handa <handa@m17n.org>
parents: 70704
diff changeset
9457 target = XCAR (target);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9458
18613
614b916ff5bf Fix bugs with inappropriate mixing of Lisp_Object with int.
Richard M. Stallman <rms@gnu.org>
parents: 18536
diff changeset
9459 chain = ((EQ (operation, Qinsert_file_contents)
614b916ff5bf Fix bugs with inappropriate mixing of Lisp_Object with int.
Richard M. Stallman <rms@gnu.org>
parents: 18536
diff changeset
9460 || EQ (operation, Qwrite_region))
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9461 ? Vfile_coding_system_alist
18613
614b916ff5bf Fix bugs with inappropriate mixing of Lisp_Object with int.
Richard M. Stallman <rms@gnu.org>
parents: 18536
diff changeset
9462 : (EQ (operation, Qopen_network_stream)
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9463 ? Vnetwork_coding_system_alist
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9464 : Vprocess_coding_system_alist));
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9465 if (NILP (chain))
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9466 return Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9467
25662
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
9468 for (; CONSP (chain); chain = XCDR (chain))
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9469 {
19747
bed06df9cbc5 (setup_coding_system, Ffind_operation_coding_system)
Richard M. Stallman <rms@gnu.org>
parents: 19743
diff changeset
9470 Lisp_Object elt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9471
25662
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
9472 elt = XCAR (chain);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9473 if (CONSP (elt)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9474 && ((STRINGP (target)
25662
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
9475 && STRINGP (XCAR (elt))
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
9476 && fast_string_match (XCAR (elt), target) >= 0)
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
9477 || (INTEGERP (target) && EQ (target, XCAR (elt)))))
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9478 {
25662
0a7261c1d487 Use XCAR, XCDR, and XFLOAT_DATA instead of explicit member access.
Ken Raeburn <raeburn@raeburn.org>
parents: 25370
diff changeset
9479 val = XCDR (elt);
19763
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9480 /* Here, if VAL is both a valid coding system and a valid
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9481 function symbol, we return VAL as a coding system. */
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9482 if (CONSP (val))
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9483 return val;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9484 if (! SYMBOLP (val))
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9485 return Qnil;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9486 if (! NILP (Fcoding_system_p (val)))
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9487 return Fcons (val, val);
19763
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9488 if (! NILP (Ffboundp (val)))
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9489 {
72188
6100ca974994 Comment change.
Richard M. Stallman <rms@gnu.org>
parents: 72180
diff changeset
9490 /* We use call1 rather than safe_call1
6100ca974994 Comment change.
Richard M. Stallman <rms@gnu.org>
parents: 72180
diff changeset
9491 so as to get bug reports about functions called here
6100ca974994 Comment change.
Richard M. Stallman <rms@gnu.org>
parents: 72180
diff changeset
9492 which don't handle the current interface. */
72180
f3bc55b96df5 (Ffind_operation_coding_system): Revert the change from 2006-05-29.
Eli Zaretskii <eliz@gnu.org>
parents: 71972
diff changeset
9493 val = call1 (val, Flist (nargs, args));
19763
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9494 if (CONSP (val))
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9495 return val;
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9496 if (SYMBOLP (val) && ! NILP (Fcoding_system_p (val)))
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9497 return Fcons (val, val);
ab2fd2c85986 (Ffind_operation_coding_system): If a function in
Kenichi Handa <handa@m17n.org>
parents: 19758
diff changeset
9498 }
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9499 return Qnil;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
9500 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9501 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9502 return Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9503 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
9504
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9505 DEFUN ("set-coding-system-priority", Fset_coding_system_priority,
88845
64b8f6168269 (Fset_coding_system_priority): Allow null arg list.
Dave Love <fx@gnu.org>
parents: 88771
diff changeset
9506 Sset_coding_system_priority, 0, MANY, 0,
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
9507 doc: /* Assign higher priority to the coding systems given as arguments.
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9508 If multiple coding systems belong to the same category,
89519
040a08a2a879 (Fread_coding_system): Fix arg of XSETSTRING.
Dave Love <fx@gnu.org>
parents: 89483
diff changeset
9509 all but the first one are ignored.
040a08a2a879 (Fread_coding_system): Fix arg of XSETSTRING.
Dave Love <fx@gnu.org>
parents: 89483
diff changeset
9510
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
9511 usage: (set-coding-system-priority &rest coding-systems) */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9512 (nargs, args)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9513 int nargs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9514 Lisp_Object *args;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9515 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9516 int i, j;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9517 int changed[coding_category_max];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9518 enum coding_category priorities[coding_category_max];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9519
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9520 bzero (changed, sizeof changed);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9521
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9522 for (i = j = 0; i < nargs; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9523 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9524 enum coding_category category;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9525 Lisp_Object spec, attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9526
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9527 CHECK_CODING_SYSTEM_GET_SPEC (args[i], spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9528 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9529 category = XINT (CODING_ATTR_CATEGORY (attrs));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9530 if (changed[category])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9531 /* Ignore this coding system because a coding system of the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9532 same category already had a higher priority. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9533 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9534 changed[category] = 1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9535 priorities[j++] = category;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9536 if (coding_categories[category].id >= 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9537 && ! EQ (args[i], CODING_ID_NAME (coding_categories[category].id)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9538 setup_coding_system (args[i], &coding_categories[category]);
89467
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9539 Fset (AREF (Vcoding_category_table, category), args[i]);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9540 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9541
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9542 /* Now we have decided top J priorities. Reflect the order of the
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9543 original priorities to the remaining priorities. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9544
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9545 for (i = j, j = 0; i < coding_category_max; i++, j++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9546 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9547 while (j < coding_category_max
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9548 && changed[coding_priorities[j]])
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9549 j++;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9550 if (j == coding_category_max)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9551 abort ();
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9552 priorities[i] = coding_priorities[j];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9553 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9554
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9555 bcopy (priorities, coding_priorities, sizeof priorities);
89467
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9556
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9557 /* Update `coding-category-list'. */
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9558 Vcoding_category_list = Qnil;
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9559 for (i = coding_category_max - 1; i >= 0; i--)
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9560 Vcoding_category_list
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9561 = Fcons (AREF (Vcoding_category_table, priorities[i]),
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
9562 Vcoding_category_list);
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
9563
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9564 return Qnil;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9565 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9566
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9567 DEFUN ("coding-system-priority-list", Fcoding_system_priority_list,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9568 Scoding_system_priority_list, 0, 1, 0,
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
9569 doc: /* Return a list of coding systems ordered by their priorities.
102737
f556415c326b (Fdetect_coding_region, Fcoding_system_priority_list): Improve the
Kenichi Handa <handa@m17n.org>
parents: 102422
diff changeset
9570 The list contains a subset of coding systems; i.e. coding systems
f556415c326b (Fdetect_coding_region, Fcoding_system_priority_list): Improve the
Kenichi Handa <handa@m17n.org>
parents: 102422
diff changeset
9571 assigned to each coding category (see `coding-category-list').
f556415c326b (Fdetect_coding_region, Fcoding_system_priority_list): Improve the
Kenichi Handa <handa@m17n.org>
parents: 102422
diff changeset
9572
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
9573 HIGHESTP non-nil means just return the highest priority one. */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9574 (highestp)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9575 Lisp_Object highestp;
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9576 {
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
9577 int i;
22954
928b337d953b Avoid using initializers for Lisp_Object.
Richard M. Stallman <rms@gnu.org>
parents: 22874
diff changeset
9578 Lisp_Object val;
928b337d953b Avoid using initializers for Lisp_Object.
Richard M. Stallman <rms@gnu.org>
parents: 22874
diff changeset
9579
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9580 for (i = 0, val = Qnil; i < coding_category_max; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9581 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9582 enum coding_category category = coding_priorities[i];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9583 int id = coding_categories[category].id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9584 Lisp_Object attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9585
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9586 if (id < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9587 continue;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9588 attrs = CODING_ID_ATTRS (id);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9589 if (! NILP (highestp))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9590 return CODING_ATTR_BASE_NAME (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9591 val = Fcons (CODING_ATTR_BASE_NAME (attrs), val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9592 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9593 return Fnreverse (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9594 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9595
88631
780b91d4a7e5 (setup_iso_safe_charsets): Fix arg decl for K&R.
Dave Love <fx@gnu.org>
parents: 88607
diff changeset
9596 static char *suffixes[] = { "-unix", "-dos", "-mac" };
780b91d4a7e5 (setup_iso_safe_charsets): Fix arg decl for K&R.
Dave Love <fx@gnu.org>
parents: 88607
diff changeset
9597
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9598 static Lisp_Object
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9599 make_subsidiaries (base)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9600 Lisp_Object base;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9601 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9602 Lisp_Object subsidiaries;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9603 int base_name_len = SBYTES (SYMBOL_NAME (base));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9604 char *buf = (char *) alloca (base_name_len + 6);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9605 int i;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9606
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9607 bcopy (SDATA (SYMBOL_NAME (base)), buf, base_name_len);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9608 subsidiaries = Fmake_vector (make_number (3), Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9609 for (i = 0; i < 3; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9610 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9611 bcopy (suffixes[i], buf + base_name_len, strlen (suffixes[i]) + 1);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9612 ASET (subsidiaries, i, intern (buf));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9613 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9614 return subsidiaries;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9615 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9616
22226
557fac086b1b (ascii_skip_code): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22186
diff changeset
9617
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
9618 DEFUN ("define-coding-system-internal", Fdefine_coding_system_internal,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9619 Sdefine_coding_system_internal, coding_arg_max, MANY, 0,
88544
f464d728344c (Vchar_coding_system_table, Qchar_coding_system):
Dave Love <fx@gnu.org>
parents: 88510
diff changeset
9620 doc: /* For internal use only.
f464d728344c (Vchar_coding_system_table, Qchar_coding_system):
Dave Love <fx@gnu.org>
parents: 88510
diff changeset
9621 usage: (define-coding-system-internal ...) */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9622 (nargs, args)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9623 int nargs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9624 Lisp_Object *args;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9625 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9626 Lisp_Object name;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9627 Lisp_Object spec_vec; /* [ ATTRS ALIASE EOL_TYPE ] */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9628 Lisp_Object attrs; /* Vector of attributes. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9629 Lisp_Object eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9630 Lisp_Object aliases;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9631 Lisp_Object coding_type, charset_list, safe_charsets;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9632 enum coding_category category;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9633 Lisp_Object tail, val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9634 int max_charset_id = 0;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9635 int i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9636
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9637 if (nargs < coding_arg_max)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9638 goto short_args;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9639
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9640 attrs = Fmake_vector (make_number (coding_attr_last_index), Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9641
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9642 name = args[coding_arg_name];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9643 CHECK_SYMBOL (name);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9644 CODING_ATTR_BASE_NAME (attrs) = name;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9645
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9646 val = args[coding_arg_mnemonic];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9647 if (! STRINGP (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9648 CHECK_CHARACTER (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9649 CODING_ATTR_MNEMONIC (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9650
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9651 coding_type = args[coding_arg_coding_type];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9652 CHECK_SYMBOL (coding_type);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9653 CODING_ATTR_TYPE (attrs) = coding_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9654
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9655 charset_list = args[coding_arg_charset_list];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9656 if (SYMBOLP (charset_list))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9657 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9658 if (EQ (charset_list, Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9659 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9660 if (! EQ (coding_type, Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9661 error ("Invalid charset-list");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9662 charset_list = Viso_2022_charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9663 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9664 else if (EQ (charset_list, Qemacs_mule))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9665 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9666 if (! EQ (coding_type, Qemacs_mule))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9667 error ("Invalid charset-list");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9668 charset_list = Vemacs_mule_charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9669 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9670 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9671 if (max_charset_id < XFASTINT (XCAR (tail)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9672 max_charset_id = XFASTINT (XCAR (tail));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9673 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9674 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9675 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9676 charset_list = Fcopy_sequence (charset_list);
91046
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9677 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9678 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9679 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9680
91046
35069180a991 Fix up multi-tty merge
Miles Bader <miles@gnu.org>
parents: 91041
diff changeset
9681 val = XCAR (tail);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9682 CHECK_CHARSET_GET_CHARSET (val, charset);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9683 if (EQ (coding_type, Qiso_2022)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9684 ? CHARSET_ISO_FINAL (charset) < 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9685 : EQ (coding_type, Qemacs_mule)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9686 ? CHARSET_EMACS_MULE_ID (charset) < 0
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9687 : 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9688 error ("Can't handle charset `%s'",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9689 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9690
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9691 XSETCAR (tail, make_number (charset->id));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9692 if (max_charset_id < charset->id)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9693 max_charset_id = charset->id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9694 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9695 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9696 CODING_ATTR_CHARSET_LIST (attrs) = charset_list;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9697
102186
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
9698 safe_charsets = make_uninit_string (max_charset_id + 1);
a12d39ca6870 * coding.h (struct coding_system): Make safe_charsets a pointer to
Andreas Schwab <schwab@suse.de>
parents: 102115
diff changeset
9699 memset (SDATA (safe_charsets), 255, max_charset_id + 1);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9700 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9701 SSET (safe_charsets, XFASTINT (XCAR (tail)), 0);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9702 CODING_ATTR_SAFE_CHARSETS (attrs) = safe_charsets;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9703
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9704 CODING_ATTR_ASCII_COMPAT (attrs) = args[coding_arg_ascii_compatible_p];
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9705
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9706 val = args[coding_arg_decode_translation_table];
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9707 if (! CHAR_TABLE_P (val) && ! CONSP (val))
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
9708 CHECK_SYMBOL (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9709 CODING_ATTR_DECODE_TBL (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9710
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9711 val = args[coding_arg_encode_translation_table];
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
9712 if (! CHAR_TABLE_P (val) && ! CONSP (val))
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
9713 CHECK_SYMBOL (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9714 CODING_ATTR_ENCODE_TBL (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9715
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9716 val = args[coding_arg_post_read_conversion];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9717 CHECK_SYMBOL (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9718 CODING_ATTR_POST_READ (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9719
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9720 val = args[coding_arg_pre_write_conversion];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9721 CHECK_SYMBOL (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9722 CODING_ATTR_PRE_WRITE (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9723
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9724 val = args[coding_arg_default_char];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9725 if (NILP (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9726 CODING_ATTR_DEFAULT_CHAR (attrs) = make_number (' ');
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9727 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9728 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9729 CHECK_CHARACTER (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9730 CODING_ATTR_DEFAULT_CHAR (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9731 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9732
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9733 val = args[coding_arg_for_unibyte];
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9734 CODING_ATTR_FOR_UNIBYTE (attrs) = NILP (val) ? Qnil : Qt;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9735
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9736 val = args[coding_arg_plist];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9737 CHECK_LIST (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9738 CODING_ATTR_PLIST (attrs) = val;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9739
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9740 if (EQ (coding_type, Qcharset))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9741 {
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9742 /* Generate a lisp vector of 256 elements. Each element is nil,
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9743 integer, or a list of charset IDs.
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9744
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9745 If Nth element is nil, the byte code N is invalid in this
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9746 coding system.
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9747
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9748 If Nth element is a number NUM, N is the first byte of a
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9749 charset whose ID is NUM.
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9750
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9751 If Nth element is a list of charset IDs, N is the first byte
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9752 of one of them. The list is sorted by dimensions of the
89648
d5641a606e08 (Fdefine_coding_system_internal): Fix checking of ascii compatibility.
Kenichi Handa <handa@m17n.org>
parents: 89644
diff changeset
9753 charsets. A charset of smaller dimension comes firtst. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9754 val = Fmake_vector (make_number (256), Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9755
89653
cbaa9fd1aa5c (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89648
diff changeset
9756 for (tail = charset_list; CONSP (tail); tail = XCDR (tail))
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9757 {
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9758 struct charset *charset = CHARSET_FROM_ID (XFASTINT (XCAR (tail)));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9759 int dim = CHARSET_DIMENSION (charset);
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9760 int idx = (dim - 1) * 4;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9761
89653
cbaa9fd1aa5c (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89648
diff changeset
9762 if (CHARSET_ASCII_COMPATIBLE_P (charset))
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9763 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9764
88477
5f974cbba7b3 (coding_set_source): Delete the local variable beg_byte.
Kenichi Handa <handa@m17n.org>
parents: 88473
diff changeset
9765 for (i = charset->code_space[idx];
5f974cbba7b3 (coding_set_source): Delete the local variable beg_byte.
Kenichi Handa <handa@m17n.org>
parents: 88473
diff changeset
9766 i <= charset->code_space[idx + 1]; i++)
5f974cbba7b3 (coding_set_source): Delete the local variable beg_byte.
Kenichi Handa <handa@m17n.org>
parents: 88473
diff changeset
9767 {
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9768 Lisp_Object tmp, tmp2;
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9769 int dim2;
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9770
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9771 tmp = AREF (val, i);
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9772 if (NILP (tmp))
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9773 tmp = XCAR (tail);
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9774 else if (NUMBERP (tmp))
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9775 {
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9776 dim2 = CHARSET_DIMENSION (CHARSET_FROM_ID (XFASTINT (tmp)));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9777 if (dim < dim2)
88607
18436bf3d6dd (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88598
diff changeset
9778 tmp = Fcons (XCAR (tail), Fcons (tmp, Qnil));
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9779 else
88607
18436bf3d6dd (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 88598
diff changeset
9780 tmp = Fcons (tmp, Fcons (XCAR (tail), Qnil));
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9781 }
88477
5f974cbba7b3 (coding_set_source): Delete the local variable beg_byte.
Kenichi Handa <handa@m17n.org>
parents: 88473
diff changeset
9782 else
88597
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9783 {
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9784 for (tmp2 = tmp; CONSP (tmp2); tmp2 = XCDR (tmp2))
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9785 {
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9786 dim2 = CHARSET_DIMENSION (CHARSET_FROM_ID (XFASTINT (XCAR (tmp2))));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9787 if (dim < dim2)
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9788 break;
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9789 }
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9790 if (NILP (tmp2))
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9791 tmp = nconc2 (tmp, Fcons (XCAR (tail), Qnil));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9792 else
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9793 {
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9794 XSETCDR (tmp2, Fcons (XCAR (tmp2), XCDR (tmp2)));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9795 XSETCAR (tmp2, XCAR (tail));
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9796 }
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9797 }
74b74f59bc09 (decode_coding_charset): Adjusted for the change of
Kenichi Handa <handa@m17n.org>
parents: 88587
diff changeset
9798 ASET (val, i, tmp);
88477
5f974cbba7b3 (coding_set_source): Delete the local variable beg_byte.
Kenichi Handa <handa@m17n.org>
parents: 88473
diff changeset
9799 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9800 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9801 ASET (attrs, coding_attr_charset_valids, val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9802 category = coding_category_charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9803 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9804 else if (EQ (coding_type, Qccl))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9805 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9806 Lisp_Object valids;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9807
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9808 if (nargs < coding_arg_ccl_max)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9809 goto short_args;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9810
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9811 val = args[coding_arg_ccl_decoder];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9812 CHECK_CCL_PROGRAM (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9813 if (VECTORP (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9814 val = Fcopy_sequence (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9815 ASET (attrs, coding_attr_ccl_decoder, val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9816
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9817 val = args[coding_arg_ccl_encoder];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9818 CHECK_CCL_PROGRAM (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9819 if (VECTORP (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9820 val = Fcopy_sequence (val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9821 ASET (attrs, coding_attr_ccl_encoder, val);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9822
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9823 val = args[coding_arg_ccl_valids];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9824 valids = Fmake_string (make_number (256), make_number (0));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9825 for (tail = val; !NILP (tail); tail = Fcdr (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9826 {
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9827 int from, to;
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9828
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9829 val = Fcar (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9830 if (INTEGERP (val))
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9831 {
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9832 from = to = XINT (val);
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9833 if (from < 0 || from > 255)
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9834 args_out_of_range_3 (val, make_number (0), make_number (255));
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9835 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9836 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9837 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9838 CHECK_CONS (val);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9839 CHECK_NATNUM_CAR (val);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9840 CHECK_NATNUM_CDR (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9841 from = XINT (XCAR (val));
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9842 if (from > 255)
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9843 args_out_of_range_3 (XCAR (val),
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9844 make_number (0), make_number (255));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9845 to = XINT (XCDR (val));
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9846 if (to < from || to > 255)
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9847 args_out_of_range_3 (XCDR (val),
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9848 XCAR (val), make_number (255));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9849 }
89373
4cc9e57fcabc (decode_coding_ccl, encode_coding_ccl): Call ccl_driver
Kenichi Handa <handa@m17n.org>
parents: 89331
diff changeset
9850 for (i = from; i <= to; i++)
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9851 SSET (valids, i, 1);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9852 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9853 ASET (attrs, coding_attr_ccl_valids, valids);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9854
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9855 category = coding_category_ccl;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9856 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9857 else if (EQ (coding_type, Qutf_16))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9858 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9859 Lisp_Object bom, endian;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9860
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9861 CODING_ATTR_ASCII_COMPAT (attrs) = Qnil;
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9862
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9863 if (nargs < coding_arg_utf16_max)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9864 goto short_args;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9865
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9866 bom = args[coding_arg_utf16_bom];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9867 if (! NILP (bom) && ! EQ (bom, Qt))
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
9868 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9869 CHECK_CONS (bom);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9870 val = XCAR (bom);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9871 CHECK_CODING_SYSTEM (val);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9872 val = XCDR (bom);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9873 CHECK_CODING_SYSTEM (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9874 }
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
9875 ASET (attrs, coding_attr_utf_bom, bom);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9876
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9877 endian = args[coding_arg_utf16_endian];
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9878 CHECK_SYMBOL (endian);
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9879 if (NILP (endian))
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9880 endian = Qbig;
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9881 else if (! EQ (endian, Qbig) && ! EQ (endian, Qlittle))
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9882 error ("Invalid endian: %s", SDATA (SYMBOL_NAME (endian)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9883 ASET (attrs, coding_attr_utf_16_endian, endian);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9884
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9885 category = (CONSP (bom)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9886 ? coding_category_utf_16_auto
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9887 : NILP (bom)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9888 ? (EQ (endian, Qbig)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9889 ? coding_category_utf_16_be_nosig
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9890 : coding_category_utf_16_le_nosig)
89420
c3e67ce6ee0f (Qsignature, Qendian): Delete these variables.
Kenichi Handa <handa@m17n.org>
parents: 89418
diff changeset
9891 : (EQ (endian, Qbig)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9892 ? coding_category_utf_16_be
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9893 : coding_category_utf_16_le));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9894 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9895 else if (EQ (coding_type, Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9896 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9897 Lisp_Object initial, reg_usage, request, flags;
89442
7349f4473e7f (detected_mask): Delete unused variable.
Kenichi Handa <handa@m17n.org>
parents: 89429
diff changeset
9898 int i;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9899
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9900 if (nargs < coding_arg_iso2022_max)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9901 goto short_args;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9902
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9903 initial = Fcopy_sequence (args[coding_arg_iso2022_initial]);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9904 CHECK_VECTOR (initial);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9905 for (i = 0; i < 4; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9906 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9907 val = Faref (initial, make_number (i));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9908 if (! NILP (val))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9909 {
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9910 struct charset *charset;
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9911
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9912 CHECK_CHARSET_GET_CHARSET (val, charset);
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9913 ASET (initial, i, make_number (CHARSET_ID (charset)));
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9914 if (i == 0 && CHARSET_ASCII_COMPATIBLE_P (charset))
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9915 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9916 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9917 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9918 ASET (initial, i, make_number (-1));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9919 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9920
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9921 reg_usage = args[coding_arg_iso2022_reg_usage];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9922 CHECK_CONS (reg_usage);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9923 CHECK_NUMBER_CAR (reg_usage);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9924 CHECK_NUMBER_CDR (reg_usage);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9925
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9926 request = Fcopy_sequence (args[coding_arg_iso2022_request]);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9927 for (tail = request; ! NILP (tail); tail = Fcdr (tail))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9928 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9929 int id;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9930 Lisp_Object tmp;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9931
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9932 val = Fcar (tail);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9933 CHECK_CONS (val);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9934 tmp = XCAR (val);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9935 CHECK_CHARSET_GET_ID (tmp, id);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9936 CHECK_NATNUM_CDR (val);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9937 if (XINT (XCDR (val)) >= 4)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9938 error ("Invalid graphic register number: %d", XINT (XCDR (val)));
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9939 XSETCAR (val, make_number (id));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9940 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9941
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9942 flags = args[coding_arg_iso2022_flags];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9943 CHECK_NATNUM (flags);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9944 i = XINT (flags);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9945 if (EQ (args[coding_arg_charset_list], Qiso_2022))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9946 flags = make_number (i | CODING_ISO_FLAG_FULL_SUPPORT);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9947
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9948 ASET (attrs, coding_attr_iso_initial, initial);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9949 ASET (attrs, coding_attr_iso_usage, reg_usage);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9950 ASET (attrs, coding_attr_iso_request, request);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9951 ASET (attrs, coding_attr_iso_flags, flags);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9952 setup_iso_safe_charsets (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9953
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9954 if (i & CODING_ISO_FLAG_SEVEN_BITS)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9955 category = ((i & (CODING_ISO_FLAG_LOCKING_SHIFT
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9956 | CODING_ISO_FLAG_SINGLE_SHIFT))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9957 ? coding_category_iso_7_else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9958 : EQ (args[coding_arg_charset_list], Qiso_2022)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9959 ? coding_category_iso_7
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9960 : coding_category_iso_7_tight);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9961 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9962 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9963 int id = XINT (AREF (initial, 1));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9964
88977
3b05c02eebf2 (Fdefine_coding_system_internal): Fix category setting
Kenichi Handa <handa@m17n.org>
parents: 88950
diff changeset
9965 category = (((i & CODING_ISO_FLAG_LOCKING_SHIFT)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9966 || EQ (args[coding_arg_charset_list], Qiso_2022)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9967 || id < 0)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9968 ? coding_category_iso_8_else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9969 : (CHARSET_DIMENSION (CHARSET_FROM_ID (id)) == 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9970 ? coding_category_iso_8_1
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9971 : coding_category_iso_8_2);
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
9972 }
89227
101ee928c088 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89225
diff changeset
9973 if (category != coding_category_iso_8_1
101ee928c088 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89225
diff changeset
9974 && category != coding_category_iso_8_2)
101ee928c088 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89225
diff changeset
9975 CODING_ATTR_ASCII_COMPAT (attrs) = Qnil;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9976 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9977 else if (EQ (coding_type, Qemacs_mule))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9978 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9979 if (EQ (args[coding_arg_charset_list], Qemacs_mule))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9980 ASET (attrs, coding_attr_emacs_mule_full, Qt);
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9981 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9982 category = coding_category_emacs_mule;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9983 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9984 else if (EQ (coding_type, Qshift_jis))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9985 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9986
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9987 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9988
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
9989 if (XINT (Flength (charset_list)) != 3
89739
293c9235be3f (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89732
diff changeset
9990 && XINT (Flength (charset_list)) != 4)
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
9991 error ("There should be three or four charsets");
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9992
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9993 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9994 if (CHARSET_DIMENSION (charset) != 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9995 error ("Dimension of charset %s is not one",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
9996 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9997 if (CHARSET_ASCII_COMPATIBLE_P (charset))
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
9998 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
9999
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10000 charset_list = XCDR (charset_list);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10001 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10002 if (CHARSET_DIMENSION (charset) != 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10003 error ("Dimension of charset %s is not one",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10004 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10005
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10006 charset_list = XCDR (charset_list);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10007 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10008 if (CHARSET_DIMENSION (charset) != 2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10009 error ("Dimension of charset %s is not two",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10010 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10011
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
10012 charset_list = XCDR (charset_list);
89740
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
10013 if (! NILP (charset_list))
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
10014 {
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
10015 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
10016 if (CHARSET_DIMENSION (charset) != 2)
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
10017 error ("Dimension of charset %s is not two",
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
10018 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
78c1fd14ed42 (Fdefine_coding_system_internal): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89739
diff changeset
10019 }
89732
8acde12aba89 (get_translation_table): New function.
Kenichi Handa <handa@m17n.org>
parents: 89730
diff changeset
10020
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10021 category = coding_category_sjis;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10022 Vsjis_coding_system = name;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10023 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10024 else if (EQ (coding_type, Qbig5))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10025 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10026 struct charset *charset;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10027
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10028 if (XINT (Flength (charset_list)) != 2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10029 error ("There should be just two charsets");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10030
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10031 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10032 if (CHARSET_DIMENSION (charset) != 1)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10033 error ("Dimension of charset %s is not one",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10034 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10035 if (CHARSET_ASCII_COMPATIBLE_P (charset))
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10036 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10037
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10038 charset_list = XCDR (charset_list);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10039 charset = CHARSET_FROM_ID (XINT (XCAR (charset_list)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10040 if (CHARSET_DIMENSION (charset) != 2)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10041 error ("Dimension of charset %s is not two",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10042 SDATA (SYMBOL_NAME (CHARSET_NAME (charset))));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10043
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10044 category = coding_category_big5;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10045 Vbig5_coding_system = name;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10046 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10047 else if (EQ (coding_type, Qraw_text))
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10048 {
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10049 category = coding_category_raw_text;
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10050 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10051 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10052 else if (EQ (coding_type, Qutf_8))
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10053 {
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10054 Lisp_Object bom;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10055
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10056 CODING_ATTR_ASCII_COMPAT (attrs) = Qt;
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10057
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10058 if (nargs < coding_arg_utf8_max)
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10059 goto short_args;
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10060
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10061 bom = args[coding_arg_utf8_bom];
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10062 if (! NILP (bom) && ! EQ (bom, Qt))
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10063 {
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10064 CHECK_CONS (bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10065 val = XCAR (bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10066 CHECK_CODING_SYSTEM (val);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10067 val = XCDR (bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10068 CHECK_CODING_SYSTEM (val);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10069 }
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10070 ASET (attrs, coding_attr_utf_bom, bom);
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10071
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10072 category = (CONSP (bom) ? coding_category_utf_8_auto
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10073 : NILP (bom) ? coding_category_utf_8_nosig
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10074 : coding_category_utf_8_sig);
89225
32058afc72e2 (detect_coding_charset): If only ASCII bytes are found, return 0.
Kenichi Handa <handa@m17n.org>
parents: 89221
diff changeset
10075 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10076 else if (EQ (coding_type, Qundecided))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10077 category = coding_category_undecided;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10078 else
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10079 error ("Invalid coding system type: %s",
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10080 SDATA (SYMBOL_NAME (coding_type)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10081
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10082 CODING_ATTR_CATEGORY (attrs) = make_number (category);
89468
7dbbe692f70c * coding.c (QCcategory): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89467
diff changeset
10083 CODING_ATTR_PLIST (attrs)
7dbbe692f70c * coding.c (QCcategory): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89467
diff changeset
10084 = Fcons (QCcategory, Fcons (AREF (Vcoding_category_table, category),
7dbbe692f70c * coding.c (QCcategory): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89467
diff changeset
10085 CODING_ATTR_PLIST (attrs)));
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10086 CODING_ATTR_PLIST (attrs)
93877
62d97ebb13a9 * coding.c (detect_coding_emacs_mule)
Michael Albinus <michael.albinus@gmx.de>
parents: 93595
diff changeset
10087 = Fcons (QCascii_compatible_p,
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10088 Fcons (CODING_ATTR_ASCII_COMPAT (attrs),
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10089 CODING_ATTR_PLIST (attrs)));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10090
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10091 eol_type = args[coding_arg_eol_type];
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10092 if (! NILP (eol_type)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10093 && ! EQ (eol_type, Qunix)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10094 && ! EQ (eol_type, Qdos)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10095 && ! EQ (eol_type, Qmac))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10096 error ("Invalid eol-type");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10097
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10098 aliases = Fcons (name, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10099
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10100 if (NILP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10101 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10102 eol_type = make_subsidiaries (name);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10103 for (i = 0; i < 3; i++)
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
10104 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10105 Lisp_Object this_spec, this_name, this_aliases, this_eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10106
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10107 this_name = AREF (eol_type, i);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10108 this_aliases = Fcons (this_name, Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10109 this_eol_type = (i == 0 ? Qunix : i == 1 ? Qdos : Qmac);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10110 this_spec = Fmake_vector (make_number (3), attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10111 ASET (this_spec, 1, this_aliases);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10112 ASET (this_spec, 2, this_eol_type);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10113 Fputhash (this_name, this_spec, Vcoding_system_hash_table);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10114 Vcoding_system_list = Fcons (this_name, Vcoding_system_list);
90289
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10115 val = Fassoc (Fsymbol_name (this_name), Vcoding_system_alist);
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10116 if (NILP (val))
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10117 Vcoding_system_alist
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10118 = Fcons (Fcons (Fsymbol_name (this_name), Qnil),
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10119 Vcoding_system_alist);
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
10120 }
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10121 }
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
10122
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10123 spec_vec = Fmake_vector (make_number (3), attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10124 ASET (spec_vec, 1, aliases);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10125 ASET (spec_vec, 2, eol_type);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10126
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10127 Fputhash (name, spec_vec, Vcoding_system_hash_table);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10128 Vcoding_system_list = Fcons (name, Vcoding_system_list);
90289
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10129 val = Fassoc (Fsymbol_name (name), Vcoding_system_alist);
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10130 if (NILP (val))
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10131 Vcoding_system_alist = Fcons (Fcons (Fsymbol_name (name), Qnil),
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10132 Vcoding_system_alist);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10133
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10134 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10135 int id = coding_categories[category].id;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10136
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10137 if (id < 0 || EQ (name, CODING_ID_NAME (id)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10138 setup_coding_system (name, &coding_categories[category]);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10139 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10140
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10141 return Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10142
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10143 short_args:
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10144 return Fsignal (Qwrong_number_of_arguments,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10145 Fcons (intern ("define-coding-system-internal"),
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10146 make_number (nargs)));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10147 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10148
89571
242f2cc0134b (Fdefine_coding_system_alias): Update Vcoding_system_list.
Kenichi Handa <handa@m17n.org>
parents: 89562
diff changeset
10149
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10150 DEFUN ("coding-system-put", Fcoding_system_put, Scoding_system_put,
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10151 3, 3, 0,
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10152 doc: /* Change value in CODING-SYSTEM's property list PROP to VAL. */)
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10153 (coding_system, prop, val)
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10154 Lisp_Object coding_system, prop, val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10155 {
89924
7d0f6da3ea6e (detect_coding): Delete unused variables.
Kenichi Handa <handa@m17n.org>
parents: 89917
diff changeset
10156 Lisp_Object spec, attrs;
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10157
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10158 CHECK_CODING_SYSTEM_GET_SPEC (coding_system, spec);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10159 attrs = AREF (spec, 0);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10160 if (EQ (prop, QCmnemonic))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10161 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10162 if (! STRINGP (val))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10163 CHECK_CHARACTER (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10164 CODING_ATTR_MNEMONIC (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10165 }
100303
3e044fa54e4f * coding.c (QCdefault_char): Rename from QCdefalut_char.
Juanma Barranquero <lekktu@gmail.com>
parents: 100262
diff changeset
10166 else if (EQ (prop, QCdefault_char))
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10167 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10168 if (NILP (val))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10169 val = make_number (' ');
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10170 else
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10171 CHECK_CHARACTER (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10172 CODING_ATTR_DEFAULT_CHAR (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10173 }
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10174 else if (EQ (prop, QCdecode_translation_table))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10175 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10176 if (! CHAR_TABLE_P (val) && ! CONSP (val))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10177 CHECK_SYMBOL (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10178 CODING_ATTR_DECODE_TBL (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10179 }
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10180 else if (EQ (prop, QCencode_translation_table))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10181 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10182 if (! CHAR_TABLE_P (val) && ! CONSP (val))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10183 CHECK_SYMBOL (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10184 CODING_ATTR_ENCODE_TBL (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10185 }
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10186 else if (EQ (prop, QCpost_read_conversion))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10187 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10188 CHECK_SYMBOL (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10189 CODING_ATTR_POST_READ (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10190 }
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10191 else if (EQ (prop, QCpre_write_conversion))
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10192 {
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10193 CHECK_SYMBOL (val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10194 CODING_ATTR_PRE_WRITE (attrs) = val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10195 }
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10196 else if (EQ (prop, QCascii_compatible_p))
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10197 {
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10198 CODING_ATTR_ASCII_COMPAT (attrs) = val;
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10199 }
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10200
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10201 CODING_ATTR_PLIST (attrs)
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10202 = Fplist_put (CODING_ATTR_PLIST (attrs), prop, val);
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10203 return val;
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10204 }
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10205
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10206
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10207 DEFUN ("define-coding-system-alias", Fdefine_coding_system_alias,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10208 Sdefine_coding_system_alias, 2, 2, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10209 doc: /* Define ALIAS as an alias for CODING-SYSTEM. */)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10210 (alias, coding_system)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10211 Lisp_Object alias, coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10212 {
90289
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10213 Lisp_Object spec, aliases, eol_type, val;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10214
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10215 CHECK_SYMBOL (alias);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10216 CHECK_CODING_SYSTEM_GET_SPEC (coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10217 aliases = AREF (spec, 1);
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
10218 /* ALIASES should be a list of length more than zero, and the first
89571
242f2cc0134b (Fdefine_coding_system_alias): Update Vcoding_system_list.
Kenichi Handa <handa@m17n.org>
parents: 89562
diff changeset
10219 element is a base coding system. Append ALIAS at the tail of the
242f2cc0134b (Fdefine_coding_system_alias): Update Vcoding_system_list.
Kenichi Handa <handa@m17n.org>
parents: 89562
diff changeset
10220 list. */
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10221 while (!NILP (XCDR (aliases)))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10222 aliases = XCDR (aliases);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10223 XSETCDR (aliases, Fcons (alias, Qnil));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10224
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10225 eol_type = AREF (spec, 2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10226 if (VECTORP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10227 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10228 Lisp_Object subsidiaries;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10229 int i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10230
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10231 subsidiaries = make_subsidiaries (alias);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10232 for (i = 0; i < 3; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10233 Fdefine_coding_system_alias (AREF (subsidiaries, i),
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10234 AREF (eol_type, i));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10235 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10236
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10237 Fputhash (alias, spec, Vcoding_system_hash_table);
89571
242f2cc0134b (Fdefine_coding_system_alias): Update Vcoding_system_list.
Kenichi Handa <handa@m17n.org>
parents: 89562
diff changeset
10238 Vcoding_system_list = Fcons (alias, Vcoding_system_list);
90289
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10239 val = Fassoc (Fsymbol_name (alias), Vcoding_system_alist);
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10240 if (NILP (val))
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10241 Vcoding_system_alist = Fcons (Fcons (Fsymbol_name (alias), Qnil),
72d8a45f6c9f (Fdefine_coding_system_internal): Avoid a duplicated
Kenichi Handa <handa@m17n.org>
parents: 90272
diff changeset
10242 Vcoding_system_alist);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10243
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10244 return Qnil;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10245 }
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10246
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10247 DEFUN ("coding-system-base", Fcoding_system_base, Scoding_system_base,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10248 1, 1, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10249 doc: /* Return the base of CODING-SYSTEM.
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
10250 Any alias or subsidiary coding system is not a base coding system. */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10251 (coding_system)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10252 Lisp_Object coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10253 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10254 Lisp_Object spec, attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10255
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10256 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10257 return (Qno_conversion);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10258 CHECK_CODING_SYSTEM_GET_SPEC (coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10259 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10260 return CODING_ATTR_BASE_NAME (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10261 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10262
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10263 DEFUN ("coding-system-plist", Fcoding_system_plist, Scoding_system_plist,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10264 1, 1, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10265 doc: "Return the property list of CODING-SYSTEM.")
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10266 (coding_system)
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10267 Lisp_Object coding_system;
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10268 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10269 Lisp_Object spec, attrs;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10270
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10271 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10272 coding_system = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10273 CHECK_CODING_SYSTEM_GET_SPEC (coding_system, spec);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10274 attrs = AREF (spec, 0);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10275 return CODING_ATTR_PLIST (attrs);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10276 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10277
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10278
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10279 DEFUN ("coding-system-aliases", Fcoding_system_aliases, Scoding_system_aliases,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10280 1, 1, 0,
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
10281 doc: /* Return the list of aliases of CODING-SYSTEM. */)
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10282 (coding_system)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10283 Lisp_Object coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10284 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10285 Lisp_Object spec;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10286
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10287 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10288 coding_system = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10289 CHECK_CODING_SYSTEM_GET_SPEC (coding_system, spec);
88645
d099a8b267fe Doc fixes.
Dave Love <fx@gnu.org>
parents: 88631
diff changeset
10290 return AREF (spec, 1);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10291 }
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10292
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10293 DEFUN ("coding-system-eol-type", Fcoding_system_eol_type,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10294 Scoding_system_eol_type, 1, 1, 0,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10295 doc: /* Return eol-type of CODING-SYSTEM.
95088
524350e4961c (Fcoding_system_p): Rename argument to match docstring.
Juanma Barranquero <lekktu@gmail.com>
parents: 94963
diff changeset
10296 An eol-type is an integer 0, 1, 2, or a vector of coding systems.
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10297
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10298 Integer values 0, 1, and 2 indicate a format of end-of-line; LF, CRLF,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10299 and CR respectively.
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10300
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10301 A vector value indicates that a format of end-of-line should be
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10302 detected automatically. Nth element of the vector is the subsidiary
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10303 coding system whose eol-type is N. */)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10304 (coding_system)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10305 Lisp_Object coding_system;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10306 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10307 Lisp_Object spec, eol_type;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10308 int n;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10309
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10310 if (NILP (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10311 coding_system = Qno_conversion;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10312 if (! CODING_SYSTEM_P (coding_system))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10313 return Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10314 spec = CODING_SYSTEM_SPEC (coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10315 eol_type = AREF (spec, 2);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10316 if (VECTORP (eol_type))
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10317 return Fcopy_sequence (eol_type);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10318 n = EQ (eol_type, Qunix) ? 0 : EQ (eol_type, Qdos) ? 1 : 2;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10319 return make_number (n);
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10320 }
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10321
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10322 #endif /* emacs */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10323
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10324
22874
b133f07a76db (Qvalid_codes): New variable.
Kenichi Handa <handa@m17n.org>
parents: 22812
diff changeset
10325 /*** 9. Post-amble ***/
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10326
21514
fa9ff387d260 Fix -Wimplicit warnings.
Andreas Schwab <schwab@suse.de>
parents: 21505
diff changeset
10327 void
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10328 init_coding_once ()
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10329 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10330 int i;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10331
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10332 for (i = 0; i < coding_category_max; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10333 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10334 coding_categories[i].id = -1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10335 coding_priorities[i] = i;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10336 }
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10337
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10338 /* ISO2022 specific initialize routine. */
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10339 for (i = 0; i < 0x20; i++)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
10340 iso_code_class[i] = ISO_control_0;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10341 for (i = 0x21; i < 0x7F; i++)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10342 iso_code_class[i] = ISO_graphic_plane_0;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10343 for (i = 0x80; i < 0xA0; i++)
29005
b396df3a5181 (ONE_MORE_BYTE, TWO_MORE_BYTES): Set coding->resutl to
Kenichi Handa <handa@m17n.org>
parents: 28512
diff changeset
10344 iso_code_class[i] = ISO_control_1;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10345 for (i = 0xA1; i < 0xFF; i++)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10346 iso_code_class[i] = ISO_graphic_plane_1;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10347 iso_code_class[0x20] = iso_code_class[0x7F] = ISO_0x20_or_0x7F;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10348 iso_code_class[0xA0] = iso_code_class[0xFF] = ISO_0xA0_or_0xFF;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10349 iso_code_class[ISO_CODE_SO] = ISO_shift_out;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10350 iso_code_class[ISO_CODE_SI] = ISO_shift_in;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10351 iso_code_class[ISO_CODE_SS2_7] = ISO_single_shift_2_7;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10352 iso_code_class[ISO_CODE_ESC] = ISO_escape;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10353 iso_code_class[ISO_CODE_SS2] = ISO_single_shift_2;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10354 iso_code_class[ISO_CODE_SS3] = ISO_single_shift_3;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10355 iso_code_class[ISO_CODE_CSI] = ISO_control_sequence_introducer;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10356
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10357 for (i = 0; i < 256; i++)
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10358 {
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10359 emacs_mule_bytes[i] = 1;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10360 }
88876
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
10361 emacs_mule_bytes[EMACS_MULE_LEADING_CODE_PRIVATE_11] = 3;
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
10362 emacs_mule_bytes[EMACS_MULE_LEADING_CODE_PRIVATE_12] = 3;
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
10363 emacs_mule_bytes[EMACS_MULE_LEADING_CODE_PRIVATE_21] = 4;
af9012fdad56 (LEADING_CODE_PRIVATE_11, LEADING_CODE_PRIVATE_12,
Kenichi Handa <handa@m17n.org>
parents: 88862
diff changeset
10364 emacs_mule_bytes[EMACS_MULE_LEADING_CODE_PRIVATE_22] = 4;
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10365 }
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10366
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10367 #ifdef emacs
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10368
21514
fa9ff387d260 Fix -Wimplicit warnings.
Andreas Schwab <schwab@suse.de>
parents: 21505
diff changeset
10369 void
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10370 syms_of_coding ()
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10371 {
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10372 staticpro (&Vcoding_system_hash_table);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10373 {
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10374 Lisp_Object args[2];
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10375 args[0] = QCtest;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10376 args[1] = Qeq;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10377 Vcoding_system_hash_table = Fmake_hash_table (2, args);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10378 }
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10379
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10380 staticpro (&Vsjis_coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10381 Vsjis_coding_system = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10382
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10383 staticpro (&Vbig5_coding_system);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10384 Vbig5_coding_system = Qnil;
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10385
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
10386 staticpro (&Vcode_conversion_reused_workbuf);
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
10387 Vcode_conversion_reused_workbuf = Qnil;
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
10388
58637
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
10389 staticpro (&Vcode_conversion_workbuf_name);
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
10390 Vcode_conversion_workbuf_name = build_string (" *code-conversion-work*");
ff8a37b5299b (Vcode_conversion_workbuf_name): New variable.
Kenichi Handa <handa@m17n.org>
parents: 58502
diff changeset
10391
89665
9010cefe8d29 (enum iso_code_class_type): Delete ISO_carriage_return.
Kenichi Handa <handa@m17n.org>
parents: 89653
diff changeset
10392 reused_workbuf_in_use = 0;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10393
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10394 DEFSYM (Qcharset, "charset");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10395 DEFSYM (Qtarget_idx, "target-idx");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10396 DEFSYM (Qcoding_system_history, "coding-system-history");
19750
95e4e1cba6ac (Qcoding_system_history): New variable.
Richard M. Stallman <rms@gnu.org>
parents: 19747
diff changeset
10397 Fset (Qcoding_system_history, Qnil);
95e4e1cba6ac (Qcoding_system_history): New variable.
Richard M. Stallman <rms@gnu.org>
parents: 19747
diff changeset
10398
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10399 /* Target FILENAME is the first argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10400 Fput (Qinsert_file_contents, Qtarget_idx, make_number (0));
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10401 /* Target FILENAME is the third argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10402 Fput (Qwrite_region, Qtarget_idx, make_number (2));
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10403
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10404 DEFSYM (Qcall_process, "call-process");
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10405 /* Target PROGRAM is the first argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10406 Fput (Qcall_process, Qtarget_idx, make_number (0));
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10407
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10408 DEFSYM (Qcall_process_region, "call-process-region");
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10409 /* Target PROGRAM is the third argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10410 Fput (Qcall_process_region, Qtarget_idx, make_number (2));
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10411
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10412 DEFSYM (Qstart_process, "start-process");
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10413 /* Target PROGRAM is the third argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10414 Fput (Qstart_process, Qtarget_idx, make_number (2));
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10415
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10416 DEFSYM (Qopen_network_stream, "open-network-stream");
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10417 /* Target SERVICE is the fourth argument. */
17119
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10418 Fput (Qopen_network_stream, Qtarget_idx, make_number (3));
2cfb31c15ced (create_process, Fopen_network_stream): Typo in indexes
Kenichi Handa <handa@m17n.org>
parents: 17071
diff changeset
10419
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10420 DEFSYM (Qcoding_system, "coding-system");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10421 DEFSYM (Qcoding_aliases, "coding-aliases");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10422
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10423 DEFSYM (Qeol_type, "eol-type");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10424 DEFSYM (Qunix, "unix");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10425 DEFSYM (Qdos, "dos");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10426
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10427 DEFSYM (Qbuffer_file_coding_system, "buffer-file-coding-system");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10428 DEFSYM (Qpost_read_conversion, "post-read-conversion");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10429 DEFSYM (Qpre_write_conversion, "pre-write-conversion");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10430 DEFSYM (Qdefault_char, "default-char");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10431 DEFSYM (Qundecided, "undecided");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10432 DEFSYM (Qno_conversion, "no-conversion");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10433 DEFSYM (Qraw_text, "raw-text");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10434
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10435 DEFSYM (Qiso_2022, "iso-2022");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10436
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10437 DEFSYM (Qutf_8, "utf-8");
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10438 DEFSYM (Qutf_8_emacs, "utf-8-emacs");
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10439
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10440 DEFSYM (Qutf_16, "utf-16");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10441 DEFSYM (Qbig, "big");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10442 DEFSYM (Qlittle, "little");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10443
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10444 DEFSYM (Qshift_jis, "shift-jis");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10445 DEFSYM (Qbig5, "big5");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10446
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10447 DEFSYM (Qcoding_system_p, "coding-system-p");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10448
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10449 DEFSYM (Qcoding_system_error, "coding-system-error");
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10450 Fput (Qcoding_system_error, Qerror_conditions,
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10451 Fcons (Qcoding_system_error, Fcons (Qerror, Qnil)));
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10452 Fput (Qcoding_system_error, Qerror_message,
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10453 build_string ("Invalid coding system"));
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10454
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
10455 /* Intern this now in case it isn't already done.
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
10456 Setting this variable twice is harmless.
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
10457 But don't staticpro it here--that is done in alloc.c. */
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
10458 Qchar_table_extra_slots = intern ("char-table-extra-slots");
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10459
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10460 DEFSYM (Qtranslation_table, "translation-table");
89856
18b52da60a76 (get_translation): Fix previous change.
Kenichi Handa <handa@m17n.org>
parents: 89852
diff changeset
10461 Fput (Qtranslation_table, Qchar_table_extra_slots, make_number (2));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10462 DEFSYM (Qtranslation_table_id, "translation-table-id");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10463 DEFSYM (Qtranslation_table_for_decode, "translation-table-for-decode");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10464 DEFSYM (Qtranslation_table_for_encode, "translation-table-for-encode");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10465
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10466 DEFSYM (Qvalid_codes, "valid-codes");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10467
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10468 DEFSYM (Qemacs_mule, "emacs-mule");
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10469
89468
7dbbe692f70c * coding.c (QCcategory): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89467
diff changeset
10470 DEFSYM (QCcategory, ":category");
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10471 DEFSYM (QCmnemonic, ":mnemonic");
100303
3e044fa54e4f * coding.c (QCdefault_char): Rename from QCdefalut_char.
Juanma Barranquero <lekktu@gmail.com>
parents: 100262
diff changeset
10472 DEFSYM (QCdefault_char, ":default-char");
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10473 DEFSYM (QCdecode_translation_table, ":decode-translation-table");
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10474 DEFSYM (QCencode_translation_table, ":encode-translation-table");
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10475 DEFSYM (QCpost_read_conversion, ":post-read-conversion");
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10476 DEFSYM (QCpre_write_conversion, ":pre-write-conversion");
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10477 DEFSYM (QCascii_compatible_p, ":ascii-compatible-p");
89468
7dbbe692f70c * coding.c (QCcategory): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89467
diff changeset
10478
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10479 Vcoding_category_table
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10480 = Fmake_vector (make_number (coding_category_max), Qnil);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10481 staticpro (&Vcoding_category_table);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10482 /* Followings are target of code detection. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10483 ASET (Vcoding_category_table, coding_category_iso_7,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10484 intern ("coding-category-iso-7"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10485 ASET (Vcoding_category_table, coding_category_iso_7_tight,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10486 intern ("coding-category-iso-7-tight"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10487 ASET (Vcoding_category_table, coding_category_iso_8_1,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10488 intern ("coding-category-iso-8-1"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10489 ASET (Vcoding_category_table, coding_category_iso_8_2,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10490 intern ("coding-category-iso-8-2"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10491 ASET (Vcoding_category_table, coding_category_iso_7_else,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10492 intern ("coding-category-iso-7-else"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10493 ASET (Vcoding_category_table, coding_category_iso_8_else,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10494 intern ("coding-category-iso-8-else"));
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10495 ASET (Vcoding_category_table, coding_category_utf_8_auto,
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10496 intern ("coding-category-utf-8-auto"));
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10497 ASET (Vcoding_category_table, coding_category_utf_8_nosig,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10498 intern ("coding-category-utf-8"));
95397
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10499 ASET (Vcoding_category_table, coding_category_utf_8_sig,
c99f0a16c077 (CODING_UTF_8_BOM): New macro.
Kenichi Handa <handa@m17n.org>
parents: 95356
diff changeset
10500 intern ("coding-category-utf-8-sig"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10501 ASET (Vcoding_category_table, coding_category_utf_16_be,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10502 intern ("coding-category-utf-16-be"));
89467
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10503 ASET (Vcoding_category_table, coding_category_utf_16_auto,
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10504 intern ("coding-category-utf-16-auto"));
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10505 ASET (Vcoding_category_table, coding_category_utf_16_le,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10506 intern ("coding-category-utf-16-le"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10507 ASET (Vcoding_category_table, coding_category_utf_16_be_nosig,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10508 intern ("coding-category-utf-16-be-nosig"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10509 ASET (Vcoding_category_table, coding_category_utf_16_le_nosig,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10510 intern ("coding-category-utf-16-le-nosig"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10511 ASET (Vcoding_category_table, coding_category_charset,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10512 intern ("coding-category-charset"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10513 ASET (Vcoding_category_table, coding_category_sjis,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10514 intern ("coding-category-sjis"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10515 ASET (Vcoding_category_table, coding_category_big5,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10516 intern ("coding-category-big5"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10517 ASET (Vcoding_category_table, coding_category_ccl,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10518 intern ("coding-category-ccl"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10519 ASET (Vcoding_category_table, coding_category_emacs_mule,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10520 intern ("coding-category-emacs-mule"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10521 /* Followings are NOT target of code detection. */
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10522 ASET (Vcoding_category_table, coding_category_raw_text,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10523 intern ("coding-category-raw-text"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10524 ASET (Vcoding_category_table, coding_category_undecided,
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10525 intern ("coding-category-undecided"));
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10526
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10527 DEFSYM (Qinsufficient_source, "insufficient-source");
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10528 DEFSYM (Qinconsistent_eol, "inconsistent-eol");
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10529 DEFSYM (Qinvalid_source, "invalid-source");
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10530 DEFSYM (Qinterrupted, "interrupted");
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10531 DEFSYM (Qinsufficient_memory, "insufficient-memory");
90272
f1df126ec7de Sync to HEAD for handling autoload-coding-system.
Kenichi Handa <handa@m17n.org>
parents: 90263
diff changeset
10532 DEFSYM (Qcoding_system_define_form, "coding-system-define-form");
52794
f4d906e31662 (Qcoding_system_define_form): New variable.
Kenichi Handa <handa@m17n.org>
parents: 52401
diff changeset
10533
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10534 defsubr (&Scoding_system_p);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10535 defsubr (&Sread_coding_system);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10536 defsubr (&Sread_non_nil_coding_system);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10537 defsubr (&Scheck_coding_system);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10538 defsubr (&Sdetect_coding_region);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10539 defsubr (&Sdetect_coding_string);
30487
6165da9c89c6 (Qsafe_charsets): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 30384
diff changeset
10540 defsubr (&Sfind_coding_systems_region_internal);
46859
a26dd8891732 (unencodable_char_position): New function.
Kenichi Handa <handa@m17n.org>
parents: 46839
diff changeset
10541 defsubr (&Sunencodable_char_position);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10542 defsubr (&Scheck_coding_systems_region);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10543 defsubr (&Sdecode_coding_region);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10544 defsubr (&Sencode_coding_region);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10545 defsubr (&Sdecode_coding_string);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10546 defsubr (&Sencode_coding_string);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10547 defsubr (&Sdecode_sjis_char);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10548 defsubr (&Sencode_sjis_char);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10549 defsubr (&Sdecode_big5_char);
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10550 defsubr (&Sencode_big5_char);
18002
a14261786239 (encode_invocation_designation): Use macro
Kenichi Handa <handa@m17n.org>
parents: 17835
diff changeset
10551 defsubr (&Sset_terminal_coding_system_internal);
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
10552 defsubr (&Sset_safe_terminal_coding_system_internal);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10553 defsubr (&Sterminal_coding_system);
18002
a14261786239 (encode_invocation_designation): Use macro
Kenichi Handa <handa@m17n.org>
parents: 17835
diff changeset
10554 defsubr (&Sset_keyboard_coding_system_internal);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10555 defsubr (&Skeyboard_coding_system);
18536
69c0e220b626 (Vstandard_character_unification_table_for_decode):
Kenichi Handa <handa@m17n.org>
parents: 18523
diff changeset
10556 defsubr (&Sfind_operation_coding_system);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10557 defsubr (&Sset_coding_system_priority);
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10558 defsubr (&Sdefine_coding_system_internal);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10559 defsubr (&Sdefine_coding_system_alias);
89759
d11866e9fbf4 (QCmnemonic, QCdefalut_char)
Kenichi Handa <handa@m17n.org>
parents: 89740
diff changeset
10560 defsubr (&Scoding_system_put);
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10561 defsubr (&Scoding_system_base);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10562 defsubr (&Scoding_system_plist);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10563 defsubr (&Scoding_system_aliases);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10564 defsubr (&Scoding_system_eol_type);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10565 defsubr (&Scoding_system_priority_list);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10566
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10567 DEFVAR_LISP ("coding-system-list", &Vcoding_system_list,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10568 doc: /* List of coding systems.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10569
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10570 Do not alter the value of this variable manually. This variable should be
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10571 updated by the functions `define-coding-system' and
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10572 `define-coding-system-alias'. */);
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10573 Vcoding_system_list = Qnil;
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10574
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10575 DEFVAR_LISP ("coding-system-alist", &Vcoding_system_alist,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10576 doc: /* Alist of coding system names.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10577 Each element is one element list of coding system name.
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10578 This variable is given to `completing-read' as COLLECTION argument.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10579
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10580 Do not alter the value of this variable manually. This variable should be
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10581 updated by the functions `make-coding-system' and
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10582 `define-coding-system-alias'. */);
20105
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10583 Vcoding_system_alist = Qnil;
c017642863c2 (Qcoding_system_spec): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 19824
diff changeset
10584
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10585 DEFVAR_LISP ("coding-category-list", &Vcoding_category_list,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10586 doc: /* List of coding-categories (symbols) ordered by priority.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10587
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10588 On detecting a coding system, Emacs tries code detection algorithms
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10589 associated with each coding-category one by one in this order. When
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10590 one algorithm agrees with a byte sequence of source text, the coding
60608
4b80e9c28e8f (syms_of_coding): Docstring of coding-category-list fixed.
Kenichi Handa <handa@m17n.org>
parents: 60031
diff changeset
10591 system bound to the corresponding coding-category is selected.
4b80e9c28e8f (syms_of_coding): Docstring of coding-category-list fixed.
Kenichi Handa <handa@m17n.org>
parents: 60031
diff changeset
10592
61166
e3a6dd630fdf (Vcoding_category_list): Docstring fix.
Kenichi Handa <handa@m17n.org>
parents: 60907
diff changeset
10593 Don't modify this variable directly, but use `set-coding-priority'. */);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10594 {
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10595 int i;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10596
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10597 Vcoding_category_list = Qnil;
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10598 for (i = coding_category_max - 1; i >= 0; i--)
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10599 Vcoding_category_list
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10600 = Fcons (XVECTOR (Vcoding_category_table)->contents[i],
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10601 Vcoding_category_list);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10602 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10603
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10604 DEFVAR_LISP ("coding-system-for-read", &Vcoding_system_for_read,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10605 doc: /* Specify the coding system for read operations.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10606 It is useful to bind this variable with `let', but do not set it globally.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10607 If the value is a coding system, it is used for decoding on read operation.
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10608 If not, an appropriate element is used from one of the coding system alists.
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10609 There are three such tables: `file-coding-system-alist',
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10610 `process-coding-system-alist', and `network-coding-system-alist'. */);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10611 Vcoding_system_for_read = Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10612
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10613 DEFVAR_LISP ("coding-system-for-write", &Vcoding_system_for_write,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10614 doc: /* Specify the coding system for write operations.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10615 Programs bind this variable with `let', but you should not set it globally.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10616 If the value is a coding system, it is used for encoding of output,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10617 when writing it to a file and when sending it to a file or subprocess.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10618
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10619 If this does not specify a coding system, an appropriate element
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10620 is used from one of the coding system alists.
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10621 There are three such tables: `file-coding-system-alist',
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10622 `process-coding-system-alist', and `network-coding-system-alist'.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10623 For output to files, if the above procedure does not specify a coding system,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10624 the value of `buffer-file-coding-system' is used. */);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10625 Vcoding_system_for_write = Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10626
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10627 DEFVAR_LISP ("last-coding-system-used", &Vlast_coding_system_used,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10628 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10629 Coding system used in the latest file or process I/O. */);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10630 Vlast_coding_system_used = Qnil;
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10631
89686
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10632 DEFVAR_LISP ("last-code-conversion-error", &Vlast_code_conversion_error,
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10633 doc: /*
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10634 Error status of the last code conversion.
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10635
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10636 When an error was detected in the last code conversion, this variable
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10637 is set to one of the following symbols.
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10638 `insufficient-source'
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10639 `inconsistent-eol'
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10640 `invalid-source'
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10641 `interrupted'
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10642 `insufficient-memory'
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10643 When no error was detected, the value doesn't change. So, to check
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10644 the error status of a code conversion by this variable, you must
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10645 explicitly set this variable to nil before performing code
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10646 conversion. */);
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10647 Vlast_code_conversion_error = Qnil;
9bfefb13fe83 (Qinsufficient_source, Qinconsistent_eol)
Kenichi Handa <handa@m17n.org>
parents: 89676
diff changeset
10648
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10649 DEFVAR_BOOL ("inhibit-eol-conversion", &inhibit_eol_conversion,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10650 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10651 *Non-nil means always inhibit code conversion of end-of-line format.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10652 See info node `Coding Systems' and info node `Text and Binary' concerning
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10653 such conversion. */);
18650
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10654 inhibit_eol_conversion = 0;
aa3f2820e2ac (Qemacs_mule, inhibit_eol_conversion): New variables.
Kenichi Handa <handa@m17n.org>
parents: 18613
diff changeset
10655
21574
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
10656 DEFVAR_BOOL ("inherit-process-coding-system", &inherit_process_coding_system,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10657 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10658 Non-nil means process buffer inherits coding system of process output.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10659 Bind it to t if the process output is to be treated as if it were a file
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10660 read from some filesystem. */);
21574
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
10661 inherit_process_coding_system = 0;
30394e3ae7f8 (syms_of_coding): Declare and define inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents: 21520
diff changeset
10662
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10663 DEFVAR_LISP ("file-coding-system-alist", &Vfile_coding_system_alist,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10664 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10665 Alist to decide a coding system to use for a file I/O operation.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10666 The format is ((PATTERN . VAL) ...),
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10667 where PATTERN is a regular expression matching a file name,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10668 VAL is a coding system, a cons of coding systems, or a function symbol.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10669 If VAL is a coding system, it is used for both decoding and encoding
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10670 the file contents.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10671 If VAL is a cons of coding systems, the car part is used for decoding,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10672 and the cdr part is used for encoding.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10673 If VAL is a function symbol, the function must return a coding system
72323
af796bc81ff0 (syms_of_coding): Improve the docstring
Kenichi Handa <handa@m17n.org>
parents: 72188
diff changeset
10674 or a cons of coding systems which are used as above. The function is
af796bc81ff0 (syms_of_coding): Improve the docstring
Kenichi Handa <handa@m17n.org>
parents: 72188
diff changeset
10675 called with an argument that is a list of the arguments with which
81611
ae42ad5f89e6 (Ffind_operation_coding_system): Docstring improved.
Kenichi Handa <handa@m17n.org>
parents: 75348
diff changeset
10676 `find-operation-coding-system' was called. If the function can't decide
ae42ad5f89e6 (Ffind_operation_coding_system): Docstring improved.
Kenichi Handa <handa@m17n.org>
parents: 75348
diff changeset
10677 a coding system, it can return `undecided' so that the normal
ae42ad5f89e6 (Ffind_operation_coding_system): Docstring improved.
Kenichi Handa <handa@m17n.org>
parents: 75348
diff changeset
10678 code-detection is performed.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10679
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10680 See also the function `find-operation-coding-system'
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10681 and the variable `auto-coding-alist'. */);
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10682 Vfile_coding_system_alist = Qnil;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10683
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10684 DEFVAR_LISP ("process-coding-system-alist", &Vprocess_coding_system_alist,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10685 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10686 Alist to decide a coding system to use for a process I/O operation.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10687 The format is ((PATTERN . VAL) ...),
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10688 where PATTERN is a regular expression matching a program name,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10689 VAL is a coding system, a cons of coding systems, or a function symbol.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10690 If VAL is a coding system, it is used for both decoding what received
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10691 from the program and encoding what sent to the program.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10692 If VAL is a cons of coding systems, the car part is used for decoding,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10693 and the cdr part is used for encoding.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10694 If VAL is a function symbol, the function must return a coding system
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10695 or a cons of coding systems which are used as above.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10696
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10697 See also the function `find-operation-coding-system'. */);
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10698 Vprocess_coding_system_alist = Qnil;
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10699
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10700 DEFVAR_LISP ("network-coding-system-alist", &Vnetwork_coding_system_alist,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10701 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10702 Alist to decide a coding system to use for a network I/O operation.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10703 The format is ((PATTERN . VAL) ...),
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10704 where PATTERN is a regular expression matching a network service name
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10705 or is a port number to connect to,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10706 VAL is a coding system, a cons of coding systems, or a function symbol.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10707 If VAL is a coding system, it is used for both decoding what received
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10708 from the network stream and encoding what sent to the network stream.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10709 If VAL is a cons of coding systems, the car part is used for decoding,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10710 and the cdr part is used for encoding.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10711 If VAL is a function symbol, the function must return a coding system
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10712 or a cons of coding systems which are used as above.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10714 See also the function `find-operation-coding-system'. */);
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10715 Vnetwork_coding_system_alist = Qnil;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10716
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10717 DEFVAR_LISP ("locale-coding-system", &Vlocale_coding_system,
41026
6f20449b7e12 (syms_of_coding): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents: 41006
diff changeset
10718 doc: /* Coding system to use with system messages.
6f20449b7e12 (syms_of_coding): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents: 41006
diff changeset
10719 Also used for decoding keyboard input on X Window system. */);
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10720 Vlocale_coding_system = Qnil;
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10721
29182
1d1c27067af4 (encode_eol): Add null statement after label.
Dave Love <fx@gnu.org>
parents: 29172
diff changeset
10722 /* The eol mnemonics are reset in startup.el system-dependently. */
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10723 DEFVAR_LISP ("eol-mnemonic-unix", &eol_mnemonic_unix,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10724 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10725 *String displayed in mode line for UNIX-like (LF) end-of-line format. */);
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10726 eol_mnemonic_unix = build_string (":");
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10727
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10728 DEFVAR_LISP ("eol-mnemonic-dos", &eol_mnemonic_dos,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10729 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10730 *String displayed in mode line for DOS-like (CRLF) end-of-line format. */);
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10731 eol_mnemonic_dos = build_string ("\\");
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10732
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10733 DEFVAR_LISP ("eol-mnemonic-mac", &eol_mnemonic_mac,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10734 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10735 *String displayed in mode line for MAC-like (CR) end-of-line format. */);
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10736 eol_mnemonic_mac = build_string ("/");
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10737
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10738 DEFVAR_LISP ("eol-mnemonic-undecided", &eol_mnemonic_undecided,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10739 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10740 *String displayed in mode line when end-of-line format is not yet determined. */);
24200
b9d9fccad516 (syms_of_coding): eol-mnemonic-* variables are now
Eli Zaretskii <eliz@gnu.org>
parents: 24178
diff changeset
10741 eol_mnemonic_undecided = build_string (":");
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10742
22119
592bb8b9bcfd Change terms unify/unification to
Kenichi Handa <handa@m17n.org>
parents: 22020
diff changeset
10743 DEFVAR_LISP ("enable-character-translation", &Venable_character_translation,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10744 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10745 *Non-nil enables character translation while encoding and decoding. */);
22119
592bb8b9bcfd Change terms unify/unification to
Kenichi Handa <handa@m17n.org>
parents: 22020
diff changeset
10746 Venable_character_translation = Qt;
592bb8b9bcfd Change terms unify/unification to
Kenichi Handa <handa@m17n.org>
parents: 22020
diff changeset
10747
22186
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
10748 DEFVAR_LISP ("standard-translation-table-for-decode",
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10749 &Vstandard_translation_table_for_decode,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10750 doc: /* Table for translating characters while decoding. */);
22186
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
10751 Vstandard_translation_table_for_decode = Qnil;
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
10752
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
10753 DEFVAR_LISP ("standard-translation-table-for-encode",
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10754 &Vstandard_translation_table_for_encode,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10755 doc: /* Table for translating characters while encoding. */);
22186
fc4aaf1b1772 Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents: 22166
diff changeset
10756 Vstandard_translation_table_for_encode = Qnil;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10757
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10758 DEFVAR_LISP ("charset-revision-table", &Vcharset_revision_table,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10759 doc: /* Alist of charsets vs revision numbers.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10760 While encoding, if a charset (car part of an element) is found,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10761 designate it with the escape sequence identifying revision (cdr part
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10762 of the element). */);
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10763 Vcharset_revision_table = Qnil;
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10764
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10765 DEFVAR_LISP ("default-process-coding-system",
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10766 &Vdefault_process_coding_system,
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10767 doc: /* Cons of coding systems used for process I/O by default.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10768 The car part is used for decoding a process output,
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10769 the cdr part is used for encoding a text to be sent to a process. */);
18180
5f4c4da24e75 (Vcoding_system_alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents: 18002
diff changeset
10770 Vdefault_process_coding_system = Qnil;
19280
e755044718ee (ENCODE_ISO_CHARACTER_DIMENSION1): Pay attention to
Kenichi Handa <handa@m17n.org>
parents: 19193
diff changeset
10771
19365
d9374f5ebd3a (CODING_FLAG_ISO_LATIN_EXTRA): New macro.
Kenichi Handa <handa@m17n.org>
parents: 19285
diff changeset
10772 DEFVAR_LISP ("latin-extra-code-table", &Vlatin_extra_code_table,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10773 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10774 Table of extra Latin codes in the range 128..159 (inclusive).
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10775 This is a vector of length 256.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10776 If Nth element is non-nil, the existence of code N in a file
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10777 \(or output of subprocess) doesn't prevent it to be detected as
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10778 a coding system of ISO 2022 variant which has a flag
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10779 `accept-latin-extra-code' t (e.g. iso-latin-1) on reading a file
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10780 or reading output of a subprocess.
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10781 Only 128th through 159th elements have a meaning. */);
19365
d9374f5ebd3a (CODING_FLAG_ISO_LATIN_EXTRA): New macro.
Kenichi Handa <handa@m17n.org>
parents: 19285
diff changeset
10782 Vlatin_extra_code_table = Fmake_vector (make_number (256), Qnil);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10783
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10784 DEFVAR_LISP ("select-safe-coding-system-function",
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10785 &Vselect_safe_coding_system_function,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10786 doc: /*
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10787 Function to call to select safe coding system for encoding a text.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10788
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10789 If set, this function is called to force a user to select a proper
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10790 coding system which can encode the text in the case that a default
87778
0ec6f8d26078 (select-safe-coding-system-function): Doc fix.
Glenn Morris <rgm@gnu.org>
parents: 87710
diff changeset
10791 coding system used in each operation can't encode the text. The
0ec6f8d26078 (select-safe-coding-system-function): Doc fix.
Glenn Morris <rgm@gnu.org>
parents: 87710
diff changeset
10792 function should take care that the buffer is not modified while
0ec6f8d26078 (select-safe-coding-system-function): Doc fix.
Glenn Morris <rgm@gnu.org>
parents: 87710
diff changeset
10793 the coding system is being selected.
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10794
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10795 The default value is `select-safe-coding-system' (which see). */);
20718
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10796 Vselect_safe_coding_system_function = Qnil;
c600dea3b06b Vselect_safe_coding_system_function): New variable.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
10797
48874
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10798 DEFVAR_BOOL ("coding-system-require-warning",
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10799 &coding_system_require_warning,
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10800 doc: /* Internal use only.
49539
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10801 If non-nil, on writing a file, `select-safe-coding-system-function' is
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10802 called even if `coding-system-for-write' is non-nil. The command
1ad5bfbb831a (syms_of_coding): Add `...' for symbols in the docstring of
Kenichi Handa <handa@m17n.org>
parents: 48874
diff changeset
10803 `universal-coding-system-argument' binds this variable to t temporarily. */);
48874
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10804 coding_system_require_warning = 0;
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10805
3002a87cc629 (coding_system_require_warning): New variable.
Kenichi Handa <handa@m17n.org>
parents: 48829
diff changeset
10806
30292
14a9937df1f5 (syms_of_coding): Fix typo in spelling of variable
Gerd Moellmann <gerd@gnu.org>
parents: 30263
diff changeset
10807 DEFVAR_BOOL ("inhibit-iso-escape-detection",
30204
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
10808 &inhibit_iso_escape_detection,
88365
d29ddd7d50f9 Completely re-written.
Kenichi Handa <handa@m17n.org>
parents: 43041
diff changeset
10809 doc: /*
101040
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10810 If non-nil, Emacs ignores ISO-2022 escape sequences during code detection.
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10811
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10812 When Emacs reads text, it tries to detect how the text is encoded.
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10813 This code detection is sensitive to escape sequences. If Emacs sees
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10814 a valid ISO-2022 escape sequence, it assumes the text is encoded in one
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10815 of the ISO2022 encodings, and decodes text by the corresponding coding
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10816 system (e.g. `iso-2022-7bit').
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10817
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10818 However, there may be a case that you want to read escape sequences in
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10819 a file as is. In such a case, you can set this variable to non-nil.
101040
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10820 Then the code detection will ignore any escape sequences, and no text is
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10821 detected as encoded in some ISO-2022 encoding. The result is that all
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10822 escape sequences become visible in a buffer.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10823
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10824 The default value is nil, and it is strongly recommended not to change
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10825 it. That is because many Emacs Lisp source files that contain
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10826 non-ASCII characters are encoded by the coding system `iso-2022-7bit'
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10827 in Emacs's distribution, and they won't be decoded correctly on
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10828 reading if you suppress escape sequence detection.
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10829
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10830 The other way to read escape sequences in a file without decoding is
101040
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10831 to explicitly specify some coding system that doesn't use ISO-2022
40713
42351475da08 Change doc-string comments to `new style' [w/`doc:' keyword].
Pavel Janík <Pavel@Janik.cz>
parents: 40656
diff changeset
10832 escape sequence (e.g `latin-1') on reading by \\[universal-coding-system-argument]. */);
30204
35aec8514228 (inhibit_iso_escape_detection): New variable.
Kenichi Handa <handa@m17n.org>
parents: 29985
diff changeset
10833 inhibit_iso_escape_detection = 0;
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
10834
101040
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10835 DEFVAR_BOOL ("inhibit-null-byte-detection",
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10836 &inhibit_null_byte_detection,
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10837 doc: /* If non-nil, Emacs ignores null bytes on code detection.
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10838 By default, Emacs treats it as binary data, and does not attempt to
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10839 decode it. The effect is as if you specified `no-conversion' for
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10840 reading that text.
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10841
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10842 Set this to non-nil when a regular text happens to include null bytes.
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10843 Examples are Index nodes of Info files and null-byte delimited output
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10844 from GNU Find and GNU Grep. Emacs will then ignore the null bytes and
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10845 decode text as usual. */);
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10846 inhibit_null_byte_detection = 0;
92b6c5b767f8 Fix Bug #876:
Eli Zaretskii <eliz@gnu.org>
parents: 100951
diff changeset
10847
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
10848 DEFVAR_LISP ("translation-table-for-input", &Vtranslation_table_for_input,
48230
c2ce8280fb97 (Vtranslation_table_for_input): New.
Dave Love <fx@gnu.org>
parents: 48182
diff changeset
10849 doc: /* Char table for translating self-inserting characters.
95356
90b4a0dc21cc (Fdecode_coding_region, Fencode_coding_region, Fencode_coding_string):
Juanma Barranquero <lekktu@gmail.com>
parents: 95353
diff changeset
10850 This is applied to the result of input methods, not their input.
101854
7e576fc18303 (syms_of_coding) <translation-table-for-input>: Modify doc string to
Eli Zaretskii <eliz@gnu.org>
parents: 101776
diff changeset
10851 See also `keyboard-translate-table'.
7e576fc18303 (syms_of_coding) <translation-table-for-input>: Modify doc string to
Eli Zaretskii <eliz@gnu.org>
parents: 101776
diff changeset
10852
7e576fc18303 (syms_of_coding) <translation-table-for-input>: Modify doc string to
Eli Zaretskii <eliz@gnu.org>
parents: 101776
diff changeset
10853 Use of this variable for character code unification was rendered
7e576fc18303 (syms_of_coding) <translation-table-for-input>: Modify doc string to
Eli Zaretskii <eliz@gnu.org>
parents: 101776
diff changeset
10854 obsolete in Emacs 23.1 and later, since Unicode is now the basis of
7e576fc18303 (syms_of_coding) <translation-table-for-input>: Modify doc string to
Eli Zaretskii <eliz@gnu.org>
parents: 101776
diff changeset
10855 internal character representation. */);
48182
9474e269efd1 Reformat some DEFUNs so that etags works.
Dave Love <fx@gnu.org>
parents: 48125
diff changeset
10856 Vtranslation_table_for_input = Qnil;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10857
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10858 {
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10859 Lisp_Object args[coding_arg_max];
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10860 Lisp_Object plist[16];
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10861 int i;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10862
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10863 for (i = 0; i < coding_arg_max; i++)
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10864 args[i] = Qnil;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10865
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10866 plist[0] = intern (":name");
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10867 plist[1] = args[coding_arg_name] = Qno_conversion;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10868 plist[2] = intern (":mnemonic");
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10869 plist[3] = args[coding_arg_mnemonic] = make_number ('=');
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10870 plist[4] = intern (":coding-type");
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10871 plist[5] = args[coding_arg_coding_type] = Qraw_text;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10872 plist[6] = intern (":ascii-compatible-p");
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10873 plist[7] = args[coding_arg_ascii_compatible_p] = Qt;
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10874 plist[8] = intern (":default-char");
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10875 plist[9] = args[coding_arg_default_char] = make_number (0);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10876 plist[10] = intern (":for-unibyte");
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10877 plist[11] = args[coding_arg_for_unibyte] = Qt;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10878 plist[12] = intern (":docstring");
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10879 plist[13] = build_string ("Do no conversion.\n\
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10880 \n\
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10881 When you visit a file with this coding, the file is read into a\n\
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10882 unibyte buffer as is, thus each byte of a file is treated as a\n\
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10883 character.");
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10884 plist[14] = intern (":eol-type");
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10885 plist[15] = args[coding_arg_eol_type] = Qunix;
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89481
diff changeset
10886 args[coding_arg_plist] = Flist (16, plist);
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10887 Fdefine_coding_system_internal (coding_arg_max, args);
90011
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10888
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10889 plist[1] = args[coding_arg_name] = Qundecided;
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10890 plist[3] = args[coding_arg_mnemonic] = make_number ('-');
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10891 plist[5] = args[coding_arg_coding_type] = Qundecided;
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10892 /* This is already set.
90214
460ee00505d5 (QCascii_compatible_p): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90201
diff changeset
10893 plist[7] = args[coding_arg_ascii_compatible_p] = Qt; */
90011
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10894 plist[8] = intern (":charset-list");
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10895 plist[9] = args[coding_arg_charset_list] = Fcons (Qascii, Qnil);
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10896 plist[11] = args[coding_arg_for_unibyte] = Qnil;
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10897 plist[13] = build_string ("No conversion on encoding, automatic conversion on decoding.");
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10898 plist[15] = args[coding_arg_eol_type] = Qnil;
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10899 args[coding_arg_plist] = Flist (16, plist);
26cef35a1562 (setup_coding_system): If coding_system is nil, use
Kenichi Handa <handa@m17n.org>
parents: 89976
diff changeset
10900 Fdefine_coding_system_internal (coding_arg_max, args);
88456
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10901 }
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10902
a7b309f72920 (coding_alloc_by_making_gap): Check the case that the
Kenichi Handa <handa@m17n.org>
parents: 88443
diff changeset
10903 setup_coding_system (Qno_conversion, &safe_terminal_coding);
89467
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10904
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10905 {
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10906 int i;
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10907
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10908 for (i = 0; i < coding_category_max; i++)
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10909 Fset (AREF (Vcoding_category_table, i), Qno_conversion);
e911ca706166 (Fset_coding_system_priority): Doc fix. Update values
Kenichi Handa <handa@m17n.org>
parents: 89462
diff changeset
10910 }
90394
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10911 #if defined (MSDOS) || defined (WINDOWSNT)
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10912 system_eol_type = Qdos;
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10913 #else
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10914 system_eol_type = Qunix;
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10915 #endif
263867fe7b55 (system_eol_type): Sync with HEAD.
Kenichi Handa <handa@m17n.org>
parents: 90380
diff changeset
10916 staticpro (&system_eol_type);
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10917 }
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10918
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10919 char *
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10920 emacs_strerror (error_number)
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10921 int error_number;
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10922 {
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10923 char *str;
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10924
26526
b7438760079b * callproc.c (strerror): Remove decl.
Paul Eggert <eggert@twinsun.com>
parents: 26240
diff changeset
10925 synchronize_system_messages_locale ();
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10926 str = strerror (error_number);
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10927
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10928 if (! NILP (Vlocale_coding_system))
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10929 {
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10930 Lisp_Object dec = code_convert_string_norecord (build_string (str),
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10931 Vlocale_coding_system,
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10932 0);
46370
40db0673e6f0 Most uses of XSTRING combined with STRING_BYTES or indirection changed to
Ken Raeburn <raeburn@raeburn.org>
parents: 46293
diff changeset
10933 str = (char *) SDATA (dec);
26088
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10934 }
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10935
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10936 return str;
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10937 }
b7aa6ac26872 Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents: 26067
diff changeset
10938
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
10939 #endif /* emacs */
29184
446621f88d68 Fix junk from last checkin.
Dave Love <fx@gnu.org>
parents: 29182
diff changeset
10940
52401
695cf19ef79e Add arch taglines
Miles Bader <miles@gnu.org>
parents: 52354
diff changeset
10941 /* arch-tag: 3a3a2b01-5ff6-4071-9afe-f5b808d9229d
695cf19ef79e Add arch taglines
Miles Bader <miles@gnu.org>
parents: 52354
diff changeset
10942 (do not change this comment) */