Mercurial > emacs
annotate lisp/language/china-util.el @ 83188:1425b1df1da8
Merged in changes from CVS trunk.
Patches applied:
* miles@gnu.org--gnu-2004/emacs--cvs-trunk--0--patch-482
Update from CVS
* miles@gnu.org--gnu-2004/emacs--cvs-trunk--0--patch-483
Build-in-place tweak
* miles@gnu.org--gnu-2004/emacs--cvs-trunk--0--patch-484
Update from CVS
git-archimport-id: lorentey@elte.hu--2004/emacs--multi-tty--0--patch-228
author | Karoly Lorentey <lorentey@elte.hu> |
---|---|
date | Mon, 09 Aug 2004 11:05:10 +0000 |
parents | 695cf19ef79e |
children | 197607499a29 375f2633d815 |
rev | line source |
---|---|
42153
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
1 ;;; china-util.el --- utilities for Chinese -*- coding: iso-2022-7bit -*- |
17052 | 2 |
51079
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
3 ;; Copyright (C) 1995, 2003 Electrotechnical Laboratory, JAPAN. |
18377
8b4a66c66dd6
Change copyright notice.
Richard M. Stallman <rms@gnu.org>
parents:
18309
diff
changeset
|
4 ;; Licensed to the Free Software Foundation. |
42153
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
5 ;; Copyright (C) 1995, 2001 Free Software Foundation, Inc. |
17052 | 6 |
7 ;; Keywords: mule, multilingual, Chinese | |
8 | |
9 ;; This file is part of GNU Emacs. | |
10 | |
11 ;; GNU Emacs is free software; you can redistribute it and/or modify | |
12 ;; it under the terms of the GNU General Public License as published by | |
13 ;; the Free Software Foundation; either version 2, or (at your option) | |
14 ;; any later version. | |
15 | |
16 ;; GNU Emacs is distributed in the hope that it will be useful, | |
17 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of | |
18 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
19 ;; GNU General Public License for more details. | |
20 | |
21 ;; You should have received a copy of the GNU General Public License | |
17071 | 22 ;; along with GNU Emacs; see the file COPYING. If not, write to the |
23 ;; Free Software Foundation, Inc., 59 Temple Place - Suite 330, | |
24 ;; Boston, MA 02111-1307, USA. | |
17052 | 25 |
38414
67b464da13ec
Some fixes to follow coding conventions.
Pavel Janík <Pavel@Janik.cz>
parents:
28906
diff
changeset
|
26 ;;; Commentary: |
67b464da13ec
Some fixes to follow coding conventions.
Pavel Janík <Pavel@Janik.cz>
parents:
28906
diff
changeset
|
27 |
17052 | 28 ;;; Code: |
29 | |
42153
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
30 ;; Hz/ZW/EUC-TW encoding stuff |
17052 | 31 |
32 ;; HZ is an encoding method for Chinese character set GB2312 used | |
33 ;; widely in Internet. It is very similar to 7-bit environment of | |
34 ;; ISO-2022. The difference is that HZ uses the sequence "~{" and | |
35 ;; "~}" for designating GB2312 and ASCII respectively, hence, it | |
36 ;; doesn't uses ESC (0x1B) code. | |
37 | |
38 ;; ZW is another encoding method for Chinese character set GB2312. It | |
39 ;; encodes Chinese characters line by line by starting each line with | |
40 ;; the sequence "zW". It also uses only 7-bit as HZ. | |
41 | |
42153
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
42 ;; EUC-TW is similar to EUC-KS or EUC-JP. Its main character set is |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
43 ;; plane 1 of CNS 11643; characters of planes 2 to 7 are accessed with |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
44 ;; a single shift escape followed by three bytes: the first gives the |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
45 ;; plane, the second and third the character code. Note that characters |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
46 ;; of plane 1 are (redundantly) accessible with a single shift escape |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
47 ;; also. |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
48 |
17052 | 49 ;; ISO-2022 escape sequence to designate GB2312. |
50 (defvar iso2022-gb-designation "\e$A") | |
51 ;; HZ escape sequence to designate GB2312. | |
52 (defvar hz-gb-designnation "~{") | |
53 ;; ISO-2022 escape sequence to designate ASCII. | |
54 (defvar iso2022-ascii-designation "\e(B") | |
55 ;; HZ escape sequence to designate ASCII. | |
56 (defvar hz-ascii-designnation "~}") | |
57 ;; Regexp of ZW sequence to start GB2312. | |
58 (defvar zw-start-gb "^zW") | |
59 ;; Regexp for start of GB2312 in an encoding mixture of HZ and ZW. | |
20738
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
60 (defvar hz/zw-start-gb |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
61 (concat hz-gb-designnation "\\|" zw-start-gb "\\|[^\0-\177]")) |
17052 | 62 |
63 (defvar decode-hz-line-continuation nil | |
64 "Flag to tell if we should care line continuation convention of Hz.") | |
65 | |
20738
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
66 (defconst hz-set-msb-table |
51079
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
67 (eval-when-compile |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
68 (let ((chars nil) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
69 (i 0)) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
70 (while (< i 33) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
71 (push i chars) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
72 (setq i (1+ i))) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
73 (while (< i 127) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
74 (push (+ i 128) chars) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
75 (setq i (1+ i))) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
76 (apply 'string (nreverse chars))))) |
20738
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
77 |
17052 | 78 ;;;###autoload |
79 (defun decode-hz-region (beg end) | |
80 "Decode HZ/ZW encoded text in the current region. | |
81 Return the length of resulting text." | |
82 (interactive "r") | |
83 (save-excursion | |
84 (save-restriction | |
20738
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
85 (let (pos ch) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
86 (narrow-to-region beg end) |
17052 | 87 |
20738
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
88 ;; We, at first, convert HZ/ZW to `euc-china', |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
89 ;; then decode it. |
17052 | 90 |
20738
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
91 ;; "~\n" -> "\n", "~~" -> "~" |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
92 (goto-char (point-min)) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
93 (while (search-forward "~" nil t) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
94 (setq ch (following-char)) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
95 (if (or (= ch ?\n) (= ch ?~)) (delete-char -1))) |
17052 | 96 |
20738
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
97 ;; "^zW...\n" -> Chinese GB2312 |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
98 ;; "~{...~}" -> Chinese GB2312 |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
99 (goto-char (point-min)) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
100 (setq beg nil) |
17052 | 101 (while (re-search-forward hz/zw-start-gb nil t) |
20738
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
102 (setq pos (match-beginning 0) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
103 ch (char-after pos)) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
104 ;; Record the first position to start conversion. |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
105 (or beg (setq beg pos)) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
106 (end-of-line) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
107 (setq end (point)) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
108 (if (>= ch 128) ; 8bit GB2312 |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
109 nil |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
110 (goto-char pos) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
111 (delete-char 2) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
112 (setq end (- end 2)) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
113 (if (= ch ?z) ; ZW -> euc-china |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
114 (progn |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
115 (translate-region (point) end hz-set-msb-table) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
116 (goto-char end)) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
117 (if (search-forward hz-ascii-designnation |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
118 (if decode-hz-line-continuation nil end) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
119 t) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
120 (delete-char -2)) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
121 (setq end (point)) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
122 (translate-region pos (point) hz-set-msb-table)))) |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
123 (if beg |
f510736ce3d1
In setup-LANGUAGE-environment functions,
Kenichi Handa <handa@m17n.org>
parents:
19428
diff
changeset
|
124 (decode-coding-region beg end 'euc-china))) |
17052 | 125 (- (point-max) (point-min))))) |
126 | |
127 ;;;###autoload | |
128 (defun decode-hz-buffer () | |
129 "Decode HZ/ZW encoded text in the current buffer." | |
130 (interactive) | |
131 (decode-hz-region (point-min) (point-max))) | |
132 | |
133 ;;;###autoload | |
134 (defun encode-hz-region (beg end) | |
135 "Encode the text in the current region to HZ. | |
136 Return the length of resulting text." | |
137 (interactive "r") | |
138 (save-excursion | |
139 (save-restriction | |
140 (narrow-to-region beg end) | |
141 | |
142 ;; "~" -> "~~" | |
143 (goto-char (point-min)) | |
144 (while (search-forward "~" nil t) (insert ?~)) | |
145 | |
146 ;; Chinese GB2312 -> "~{...~}" | |
147 (goto-char (point-min)) | |
148 (if (re-search-forward "\\cc" nil t) | |
20838
3d67d591c066
(encode-hz-region): Do not bind
Kenichi Handa <handa@m17n.org>
parents:
20738
diff
changeset
|
149 (let (pos) |
17052 | 150 (goto-char (setq pos (match-beginning 0))) |
18553
62e17ab4e33e
Use true coding system names instead of
Kenichi Handa <handa@m17n.org>
parents:
18377
diff
changeset
|
151 (encode-coding-region pos (point-max) 'iso-2022-7bit) |
17052 | 152 (goto-char pos) |
153 (while (search-forward iso2022-gb-designation nil t) | |
154 (delete-char -3) | |
155 (insert hz-gb-designnation)) | |
156 (goto-char pos) | |
157 (while (search-forward iso2022-ascii-designation nil t) | |
158 (delete-char -3) | |
159 (insert hz-ascii-designnation)))) | |
160 (- (point-max) (point-min))))) | |
161 | |
162 ;;;###autoload | |
163 (defun encode-hz-buffer () | |
164 "Encode the text in the current buffer to HZ." | |
165 (interactive) | |
166 (encode-hz-region (point-min) (point-max))) | |
167 | |
42153
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
168 ;; The following sets up a translation table (big5-to-cns) from Big 5 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
169 ;; to CNS encoding, using some auxiliary functions to make the code |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
170 ;; more readable. |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
171 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
172 ;; Many kudos to Himi! The used code has been adapted from his |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
173 ;; mule-ucs package. |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
174 |
51079
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
175 (eval-when-compile |
42153
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
176 (defun big5-to-flat-code (num) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
177 "Convert NUM in Big 5 encoding to a `flat code'. |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
178 0xA140 will be mapped to position 0, 0xA141 to position 1, etc. |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
179 There are no gaps in the flat code." |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
180 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
181 (let ((hi (/ num 256)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
182 (lo (% num 256))) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
183 (+ (* 157 (- hi #xa1)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
184 (- lo (if (>= lo #xa1) 98 64))))) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
185 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
186 (defun flat-code-to-big5 (num) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
187 "Convert NUM from a `flat code' to Big 5 encoding. |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
188 This is the inverse function of `big5-to-flat-code'." |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
189 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
190 (let ((hi (/ num 157)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
191 (lo (% num 157))) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
192 (+ (* 256 (+ hi #xa1)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
193 (+ lo (if (< lo 63) 64 98))))) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
194 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
195 (defun euc-to-flat-code (num) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
196 "Convert NUM in EUC encoding (in GL representation) to a `flat code'. |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
197 0x2121 will be mapped to position 0, 0x2122 to position 1, etc. |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
198 There are no gaps in the flat code." |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
199 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
200 (let ((hi (/ num 256)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
201 (lo (% num 256))) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
202 (+ (* 94 (- hi #x21)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
203 (- lo #x21)))) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
204 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
205 (defun flat-code-to-euc (num) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
206 "Convert NUM from a `flat code' to EUC encoding (in GL representation). |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
207 The inverse function of `euc-to-flat-code'. The high and low bytes are |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
208 returned in a list." |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
209 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
210 (let ((hi (/ num 94)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
211 (lo (% num 94))) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
212 (list (+ hi #x21) (+ lo #x21)))) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
213 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
214 (defun expand-euc-big5-alist (alist) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
215 "Create a translation table and fills it with data given in ALIST. |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
216 Elements of ALIST can be either given as |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
217 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
218 ((euc-charset . startchar) . (big5-range-begin . big5-range-end)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
219 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
220 or as |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
221 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
222 (euc-character . big5-charcode) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
223 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
224 The former maps a range of glyphs in an EUC charset (where STARTCHAR |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
225 is in GL representation) to a certain range of Big 5 encoded |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
226 characters, the latter maps a single glyph. Glyphs which can't be |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
227 mapped will be represented with the byte 0xFF. |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
228 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
229 The return value is the filled translation table." |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
230 |
51079
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
231 (let ((chartable (make-char-table 'translation-table #xFF)) |
42153
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
232 char |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
233 big5 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
234 i |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
235 end |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
236 codepoint |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
237 charset) |
51079
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
238 (dolist (elem alist) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
239 (setq char (car elem) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
240 big5 (cdr elem)) |
42153
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
241 (cond ((and (consp char) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
242 (consp big5)) |
51079
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
243 (setq i (big5-to-flat-code (car big5)) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
244 end (big5-to-flat-code (cdr big5)) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
245 codepoint (euc-to-flat-code (cdr char)) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
246 charset (car char)) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
247 (while (>= end i) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
248 (aset chartable |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
249 (decode-big5-char (flat-code-to-big5 i)) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
250 (apply (function make-char) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
251 charset |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
252 (flat-code-to-euc codepoint))) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
253 (setq i (1+ i) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
254 codepoint (1+ codepoint)))) |
42153
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
255 ((and (char-valid-p char) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
256 (numberp big5)) |
51079
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
257 (setq i (decode-big5-char big5)) |
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
258 (aset chartable i char)) |
42153
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
259 (t |
51079
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
260 (error "Unknown slot type: %S" elem)))) |
42153
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
261 ;; the return value |
51079
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
262 chartable))) |
42153
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
263 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
264 ;; All non-CNS encodings are commented out. |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
265 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
266 (define-translation-table 'big5-to-cns |
51079
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
267 (eval-when-compile |
42153
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
268 (expand-euc-big5-alist |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
269 '( |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
270 ;; Symbols |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
271 ((chinese-cns11643-1 . #x2121) . (#xA140 . #xA1F5)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
272 (?$(G"X(B . #xA1F6) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
273 (?$(G"W(B . #xA1F7) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
274 ((chinese-cns11643-1 . #x2259) . (#xA1F8 . #xA2AE)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
275 ((chinese-cns11643-1 . #x2421) . (#xA2AF . #xA3BF)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
276 ;; Control codes (vendor dependent) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
277 ((chinese-cns11643-1 . #x4221) . (#xA3C0 . #xA3E0)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
278 ;; Level 1 Ideographs |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
279 ((chinese-cns11643-1 . #x4421) . (#xA440 . #xACFD)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
280 (?$(GWS(B . #xACFE) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
281 ((chinese-cns11643-1 . #x5323) . (#xAD40 . #xAFCF)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
282 ((chinese-cns11643-1 . #x5754) . (#xAFD0 . #xBBC7)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
283 ((chinese-cns11643-1 . #x6B51) . (#xBBC8 . #xBE51)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
284 (?$(GkP(B . #xBE52) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
285 ((chinese-cns11643-1 . #x6F5C) . (#xBE53 . #xC1AA)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
286 ((chinese-cns11643-1 . #x7536) . (#xC1AB . #xC2CA)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
287 (?$(Gu5(B . #xC2CB) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
288 ((chinese-cns11643-1 . #x7737) . (#xC2CC . #xC360)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
289 ((chinese-cns11643-1 . #x782E) . (#xC361 . #xC3B8)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
290 (?$(Gxe(B . #xC3B9) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
291 (?$(Gxd(B . #xC3BA) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
292 ((chinese-cns11643-1 . #x7866) . (#xC3BB . #xC455)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
293 (?$(Gx-(B . #xC456) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
294 ((chinese-cns11643-1 . #x7962) . (#xC457 . #xC67E)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
295 ;; Symbols |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
296 ((chinese-cns11643-1 . #x2621) . (#xC6A1 . #xC6BE)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
297 ;; Radicals |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
298 (?$(G'#(B . #xC6BF) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
299 (?$(G'$(B . #xC6C0) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
300 (?$(G'&(B . #xC6C1) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
301 (?$(G'((B . #xC6C2) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
302 (?$(G'-(B . #xC6C3) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
303 (?$(G'.(B . #xC6C4) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
304 (?$(G'/(B . #xC6C5) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
305 (?$(G'4(B . #xC6C6) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
306 (?$(G'7(B . #xC6C7) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
307 (?$(G':(B . #xC6C8) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
308 (?$(G'<(B . #xC6C9) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
309 (?$(G'B(B . #xC6CA) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
310 (?$(G'G(B . #xC6CB) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
311 (?$(G'N(B . #xC6CC) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
312 (?$(G'S(B . #xC6CD) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
313 (?$(G'T(B . #xC6CE) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
314 (?$(G'U(B . #xC6CF) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
315 (?$(G'Y(B . #xC6D0) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
316 (?$(G'Z(B . #xC6D1) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
317 (?$(G'a(B . #xC6D2) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
318 (?$(G'f(B . #xC6D3) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
319 (?$(G()(B . #xC6D4) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
320 (?$(G(*(B . #xC6D5) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
321 (?$(G(c(B . #xC6D6) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
322 (?$(G(l(B . #xC6D7) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
323 ;; Diacritical Marks |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
324 ; ((japanese-jisx0208 . #x212F) . (#xC6D8 . #xC6D9)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
325 ;; Japanese Kana Supplement |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
326 ; ((japanese-jisx0208 . #x2133) . (#xC6DA . #xC6E3)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
327 ;; Japanese Hiragana |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
328 ; ((japanese-jisx0208 . #x2421) . (#xC6E7 . #xC77A)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
329 ;; Japanese Katakana |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
330 ; ((japanese-jisx0208 . #x2521) . (#xC77B . #xC7F2)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
331 ;; Cyrillic Characters |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
332 ; ((japanese-jisx0208 . #x2721) . (#xC7F3 . #xC854)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
333 ; ((japanese-jisx0208 . #x2751) . (#xC855 . #xC875)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
334 ;; Special Chinese Characters |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
335 (?$(J!#(B . #xC879) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
336 (?$(J!$(B . #xC87B) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
337 (?$(J!*(B . #xC87D) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
338 (?$(J!R(B . #xC8A2) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
339 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
340 ;; JIS X 0208 NOT SIGN (cf. U+00AC) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
341 ; (?$B"L(B . #xC8CD) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
342 ;; JIS X 0212 BROKEN BAR (cf. U+00A6) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
343 ; (?$(D"C(B . #xC8CE) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
344 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
345 ;; GB 2312 characters |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
346 ; (?$A!d(B . #xC8CF) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
347 ; (?$A!e(B . #xC8D0) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
348 ;;;;; C8D1 - Japanese `($B3t(B)' |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
349 ; (?$A!m(B . #xC8D2) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
350 ;;;;; C8D2 - Tel. |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
351 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
352 ;; Level 2 Ideographs |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
353 ((chinese-cns11643-2 . #x2121) . (#xC940 . #xC949)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
354 (?$(GDB(B . #xC94A);; a duplicate of #xA461 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
355 ((chinese-cns11643-2 . #x212B) . (#xC94B . #xC96B)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
356 ((chinese-cns11643-2 . #x214D) . (#xC96C . #xC9BD)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
357 (?$(H!L(B . #xC9BE) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
358 ((chinese-cns11643-2 . #x217D) . (#xC9BF . #xC9EC)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
359 ((chinese-cns11643-2 . #x224E) . (#xC9ED . #xCAF6)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
360 (?$(H"M(B . #xCAF7) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
361 ((chinese-cns11643-2 . #x2439) . (#xCAF8 . #xD6CB)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
362 (?$(H>c(B . #xD6CC) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
363 ((chinese-cns11643-2 . #x3770) . (#xD6CD . #xD779)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
364 (?$(H?j(B . #xD77A) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
365 ((chinese-cns11643-2 . #x387E) . (#xD77B . #xDADE)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
366 (?$(H7o(B . #xDADF) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
367 ((chinese-cns11643-2 . #x3E64) . (#xDAE0 . #xDBA6)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
368 ((chinese-cns11643-2 . #x3F6B) . (#xDBA7 . #xDDFB)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
369 (?$(HAv(B . #xDDFC);; a duplicate of #xDCD1 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
370 ((chinese-cns11643-2 . #x4424) . (#xDDFD . #xE8A2)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
371 ((chinese-cns11643-2 . #x554C) . (#xE8A3 . #xE975)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
372 ((chinese-cns11643-2 . #x5723) . (#xE976 . #xEB5A)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
373 ((chinese-cns11643-2 . #x5A29) . (#xEB5B . #xEBF0)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
374 (?$(HUK(B . #xEBF1) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
375 ((chinese-cns11643-2 . #x5B3F) . (#xEBF2 . #xECDD)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
376 (?$(HW"(B . #xECDE) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
377 ((chinese-cns11643-2 . #x5C6A) . (#xECDF . #xEDA9)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
378 ((chinese-cns11643-2 . #x5D75) . (#xEDAA . #xEEEA)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
379 (?$(Hd/(B . #xEEEB) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
380 ((chinese-cns11643-2 . #x6039) . (#xEEEC . #xF055)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
381 (?$(H]t(B . #xF056) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
382 ((chinese-cns11643-2 . #x6243) . (#xF057 . #xF0CA)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
383 (?$(HZ((B . #xF0CB) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
384 ((chinese-cns11643-2 . #x6337) . (#xF0CC . #xF162)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
385 ((chinese-cns11643-2 . #x6430) . (#xF163 . #xF16A)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
386 (?$(Hga(B . #xF16B) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
387 ((chinese-cns11643-2 . #x6438) . (#xF16C . #xF267)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
388 (?$(Hi4(B . #xF268) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
389 ((chinese-cns11643-2 . #x6573) . (#xF269 . #xF2C2)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
390 ((chinese-cns11643-2 . #x664E) . (#xF2C3 . #xF374)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
391 ((chinese-cns11643-2 . #x6762) . (#xF375 . #xF465)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
392 ((chinese-cns11643-2 . #x6935) . (#xF466 . #xF4B4)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
393 (?$(HfM(B . #xF4B5) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
394 ((chinese-cns11643-2 . #x6962) . (#xF4B6 . #xF4FC)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
395 ((chinese-cns11643-2 . #x6A4C) . (#xF4FD . #xF662)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
396 (?$(HjK(B . #xF663) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
397 ((chinese-cns11643-2 . #x6C52) . (#xF664 . #xF976)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
398 ((chinese-cns11643-2 . #x7167) . (#xF977 . #xF9C3)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
399 (?$(Hqf(B . #xF9C4) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
400 (?$(Hr4(B . #xF9C5) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
401 (?$(Hr@(B . #xF9C6) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
402 ((chinese-cns11643-2 . #x7235) . (#xF9C7 . #xF9D1)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
403 ((chinese-cns11643-2 . #x7241) . (#xF9D2 . #xF9D5)) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
404 |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
405 ;; Additional Ideographs |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
406 (?$(IC7(B . #xF9D6) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
407 (?$(IOP(B . #xF9D7) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
408 (?$(IDN(B . #xF9D8) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
409 (?$(IPJ(B . #xF9D9) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
410 (?$(I,](B . #xF9DA) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
411 (?$(I=~(B . #xF9DB) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
412 (?$(IK\(B . #xF9DC) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
413 ) |
51079
bd6dedbdc53f
(hz-set-msb-table): Build when compiling.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
42153
diff
changeset
|
414 )) |
42153
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
415 ) |
ca6dbe4635da
Implementing euc-tw encoding.
Werner LEMBERG <wl@gnu.org>
parents:
38414
diff
changeset
|
416 |
17052 | 417 ;; |
18309
bd8b521f5218
Provide XXX-util instead of
Kenichi Handa <handa@m17n.org>
parents:
17993
diff
changeset
|
418 (provide 'china-util) |
17052 | 419 |
52401 | 420 ;;; arch-tag: 5a47b084-b9ac-420e-8191-70c5b3a14836 |
17052 | 421 ;;; china-util.el ends here |