Mercurial > emacs
annotate lisp/language/chinese.el @ 20399:04ce86b23ffa
(rmail-decode-quoted-printable): New function
mostly copied from gnus-art.el.
(rmail-hex-string-to-integer): New fn, copied from hexl.el.
(rmail-hex-char-to-integer): Likewise.
(rmail-convert-to-babyl-format): Use rmail-decode-quoted-printable.
author | Karl Heuer <kwzh@gnu.org> |
---|---|
date | Thu, 04 Dec 1997 04:32:03 +0000 |
parents | 36eb3e583396 |
children | 5d6f4b0c2763 |
rev | line source |
---|---|
17052 | 1 ;;; chinese.el --- Support for Chinese |
2 | |
3 ;; Copyright (C) 1995 Electrotechnical Laboratory, JAPAN. | |
18377
8b4a66c66dd6
Change copyright notice.
Richard M. Stallman <rms@gnu.org>
parents:
18309
diff
changeset
|
4 ;; Licensed to the Free Software Foundation. |
17052 | 5 |
6 ;; Keywords: multilingual, Chinese | |
7 | |
8 ;; This file is part of GNU Emacs. | |
9 | |
10 ;; GNU Emacs is free software; you can redistribute it and/or modify | |
11 ;; it under the terms of the GNU General Public License as published by | |
12 ;; the Free Software Foundation; either version 2, or (at your option) | |
13 ;; any later version. | |
14 | |
15 ;; GNU Emacs is distributed in the hope that it will be useful, | |
16 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of | |
17 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
18 ;; GNU General Public License for more details. | |
19 | |
20 ;; You should have received a copy of the GNU General Public License | |
17071 | 21 ;; along with GNU Emacs; see the file COPYING. If not, write to the |
22 ;; Free Software Foundation, Inc., 59 Temple Place - Suite 330, | |
23 ;; Boston, MA 02111-1307, USA. | |
17052 | 24 |
25 ;;; Commentary: | |
26 | |
27 ;; Three Chinese character sets are supported: GB2312, BIG5, and | |
28 ;; CNS11643. | |
29 | |
30 ;;; Code: | |
31 | |
32 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; | |
33 ;;; Chinese (general) | |
34 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; | |
35 | |
36 (make-coding-system | |
18203
0745f30aec66
Adjusted for coding system name change.
Kenichi Handa <handa@m17n.org>
parents:
18156
diff
changeset
|
37 'chinese-iso-7bit 2 ?C |
0745f30aec66
Adjusted for coding system name change.
Kenichi Handa <handa@m17n.org>
parents:
18156
diff
changeset
|
38 "ISO 2022 based 7bit encoding for Chinese GB and CNS (MIME:ISO-2022-CN)" |
17052 | 39 '(ascii |
40 (nil chinese-gb2312 chinese-cns11643-1) | |
41 (nil chinese-cns11643-2) | |
42 (nil chinese-cns11643-3 chinese-cns11643-4 chinese-cns11643-5 | |
43 chinese-cns11643-6 chinese-cns11643-7) | |
17084
07f0a1e07d1e
Add INIT-BOL to coding system iso-2022-cn.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
44 nil ascii-eol ascii-cntl seven locking-shift single-shift nil nil nil |
20158
36eb3e583396
Give proper SAFE-CHARSET argument in each
Kenichi Handa <handa@m17n.org>
parents:
20109
diff
changeset
|
45 init-bol) |
36eb3e583396
Give proper SAFE-CHARSET argument in each
Kenichi Handa <handa@m17n.org>
parents:
20109
diff
changeset
|
46 '(ascii chinese-gb2312 chinese-cns11643-1 chinese-cns11643-2 |
36eb3e583396
Give proper SAFE-CHARSET argument in each
Kenichi Handa <handa@m17n.org>
parents:
20109
diff
changeset
|
47 chinese-cns11643-3 chinese-cns11643-4 chinese-cns11643-5 |
36eb3e583396
Give proper SAFE-CHARSET argument in each
Kenichi Handa <handa@m17n.org>
parents:
20109
diff
changeset
|
48 chinese-cns11643-6 chinese-cns11643-7)) |
17084
07f0a1e07d1e
Add INIT-BOL to coding system iso-2022-cn.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
49 |
18520
383d11185239
Swap args to define-coding-system-alias.
Richard M. Stallman <rms@gnu.org>
parents:
18377
diff
changeset
|
50 (define-coding-system-alias 'iso-2022-cn 'chinese-iso-7bit) |
383d11185239
Swap args to define-coding-system-alias.
Richard M. Stallman <rms@gnu.org>
parents:
18377
diff
changeset
|
51 (define-coding-system-alias 'iso-2022-cn-ext 'chinese-iso-7bit) |
17084
07f0a1e07d1e
Add INIT-BOL to coding system iso-2022-cn.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
52 |
18156
f7296dc03177
(describe-chinese-environment-map):
Richard M. Stallman <rms@gnu.org>
parents:
17993
diff
changeset
|
53 (define-prefix-command 'describe-chinese-environment-map) |
f7296dc03177
(describe-chinese-environment-map):
Richard M. Stallman <rms@gnu.org>
parents:
17993
diff
changeset
|
54 (define-key-after describe-language-environment-map [Chinese] |
f7296dc03177
(describe-chinese-environment-map):
Richard M. Stallman <rms@gnu.org>
parents:
17993
diff
changeset
|
55 '("Chinese" . describe-chinese-environment-map) |
17993
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
56 t) |
17052 | 57 |
17993
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
58 (define-prefix-command 'setup-chinese-environment-map) |
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
59 (define-key-after setup-language-environment-map [Chinese] |
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
60 '("Chinese" . setup-chinese-environment-map) |
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
61 t) |
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
62 |
17052 | 63 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; |
64 ;;; Chinese GB2312 (simplified) | |
65 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; | |
66 | |
67 (make-coding-system | |
18203
0745f30aec66
Adjusted for coding system name change.
Kenichi Handa <handa@m17n.org>
parents:
18156
diff
changeset
|
68 'chinese-iso-8bit 2 ?c |
0745f30aec66
Adjusted for coding system name change.
Kenichi Handa <handa@m17n.org>
parents:
18156
diff
changeset
|
69 "ISO 2022 based EUC encoding for Chinese GB2312 (MIME:CN-GB-2312)" |
17052 | 70 '((ascii t) chinese-gb2312 chinese-sisheng nil |
20158
36eb3e583396
Give proper SAFE-CHARSET argument in each
Kenichi Handa <handa@m17n.org>
parents:
20109
diff
changeset
|
71 nil ascii-eol ascii-cntl nil nil single-shift nil) |
36eb3e583396
Give proper SAFE-CHARSET argument in each
Kenichi Handa <handa@m17n.org>
parents:
20109
diff
changeset
|
72 '(ascii chinese-gb2312 chinese-sisheng)) |
17052 | 73 |
18520
383d11185239
Swap args to define-coding-system-alias.
Richard M. Stallman <rms@gnu.org>
parents:
18377
diff
changeset
|
74 (define-coding-system-alias 'cn-gb-2312 'chinese-iso-8bit) |
383d11185239
Swap args to define-coding-system-alias.
Richard M. Stallman <rms@gnu.org>
parents:
18377
diff
changeset
|
75 (define-coding-system-alias 'euc-china 'chinese-iso-8bit) |
20158
36eb3e583396
Give proper SAFE-CHARSET argument in each
Kenichi Handa <handa@m17n.org>
parents:
20109
diff
changeset
|
76 (define-coding-system-alias 'euc-cn 'chinese-iso-8bit) |
17084
07f0a1e07d1e
Add INIT-BOL to coding system iso-2022-cn.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
77 |
17052 | 78 (make-coding-system |
18203
0745f30aec66
Adjusted for coding system name change.
Kenichi Handa <handa@m17n.org>
parents:
18156
diff
changeset
|
79 'chinese-hz 0 ?z |
0745f30aec66
Adjusted for coding system name change.
Kenichi Handa <handa@m17n.org>
parents:
18156
diff
changeset
|
80 "Hz/ZW 7-bit encoding for Chinese GB2312 (MIME:HZ-GB-2312)" |
20158
36eb3e583396
Give proper SAFE-CHARSET argument in each
Kenichi Handa <handa@m17n.org>
parents:
20109
diff
changeset
|
81 nil |
36eb3e583396
Give proper SAFE-CHARSET argument in each
Kenichi Handa <handa@m17n.org>
parents:
20109
diff
changeset
|
82 '(ascii chinese-gb2312)) |
20109
b68cac3f8e3a
Use coding-system-put to set coding system
Kenichi Handa <handa@m17n.org>
parents:
18520
diff
changeset
|
83 (coding-system-put 'chinese-hz 'post-read-conversion 'post-read-decode-hz) |
b68cac3f8e3a
Use coding-system-put to set coding system
Kenichi Handa <handa@m17n.org>
parents:
18520
diff
changeset
|
84 (coding-system-put 'chinese-hz 'pre-write-conversion 'pre-write-encode-hz) |
17084
07f0a1e07d1e
Add INIT-BOL to coding system iso-2022-cn.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
85 |
18520
383d11185239
Swap args to define-coding-system-alias.
Richard M. Stallman <rms@gnu.org>
parents:
18377
diff
changeset
|
86 (define-coding-system-alias 'hz-gb-2312 'chinese-hz) |
383d11185239
Swap args to define-coding-system-alias.
Richard M. Stallman <rms@gnu.org>
parents:
18377
diff
changeset
|
87 (define-coding-system-alias 'hz 'chinese-hz) |
17052 | 88 |
89 (defun post-read-decode-hz (len) | |
20109
b68cac3f8e3a
Use coding-system-put to set coding system
Kenichi Handa <handa@m17n.org>
parents:
18520
diff
changeset
|
90 (let ((pos (point)) |
b68cac3f8e3a
Use coding-system-put to set coding system
Kenichi Handa <handa@m17n.org>
parents:
18520
diff
changeset
|
91 (buffer-modified-p (buffer-modified-p)) |
b68cac3f8e3a
Use coding-system-put to set coding system
Kenichi Handa <handa@m17n.org>
parents:
18520
diff
changeset
|
92 last-coding-system-used) |
b68cac3f8e3a
Use coding-system-put to set coding system
Kenichi Handa <handa@m17n.org>
parents:
18520
diff
changeset
|
93 (prog1 |
b68cac3f8e3a
Use coding-system-put to set coding system
Kenichi Handa <handa@m17n.org>
parents:
18520
diff
changeset
|
94 (decode-hz-region pos (+ pos len)) |
b68cac3f8e3a
Use coding-system-put to set coding system
Kenichi Handa <handa@m17n.org>
parents:
18520
diff
changeset
|
95 (set-buffer-modified-p buffer-modified-p)))) |
17052 | 96 |
97 (defun pre-write-encode-hz (from to) | |
98 (let ((buf (current-buffer)) | |
99 (work (get-buffer-create " *pre-write-encoding-work*"))) | |
100 (set-buffer work) | |
101 (erase-buffer) | |
17765
9c4845e8101d
Make functions setup-LANGUAGE-environment
Kenichi Handa <handa@m17n.org>
parents:
17084
diff
changeset
|
102 (if (stringp from) |
9c4845e8101d
Make functions setup-LANGUAGE-environment
Kenichi Handa <handa@m17n.org>
parents:
17084
diff
changeset
|
103 (insert from) |
9c4845e8101d
Make functions setup-LANGUAGE-environment
Kenichi Handa <handa@m17n.org>
parents:
17084
diff
changeset
|
104 (insert-buffer-substring buf from to)) |
20109
b68cac3f8e3a
Use coding-system-put to set coding system
Kenichi Handa <handa@m17n.org>
parents:
18520
diff
changeset
|
105 (let (last-coding-system-used) |
b68cac3f8e3a
Use coding-system-put to set coding system
Kenichi Handa <handa@m17n.org>
parents:
18520
diff
changeset
|
106 (encode-hz-region 1 (point-max))) |
17052 | 107 nil)) |
108 | |
109 (set-language-info-alist | |
17993
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
110 "Chinese-GB" '((setup-function . (setup-chinese-gb-environment |
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
111 . setup-chinese-environment-map)) |
17084
07f0a1e07d1e
Add INIT-BOL to coding system iso-2022-cn.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
112 (charset . (chinese-gb2312 chinese-sisheng)) |
18203
0745f30aec66
Adjusted for coding system name change.
Kenichi Handa <handa@m17n.org>
parents:
18156
diff
changeset
|
113 (coding-system |
0745f30aec66
Adjusted for coding system name change.
Kenichi Handa <handa@m17n.org>
parents:
18156
diff
changeset
|
114 . (chinese-iso-8bit chinese-iso-7bit chinese-hz)) |
17765
9c4845e8101d
Make functions setup-LANGUAGE-environment
Kenichi Handa <handa@m17n.org>
parents:
17084
diff
changeset
|
115 (sample-text . "Chinese ($AVPND(B,$AFUM(;0(B,$A::So(B) $ADc:C(B") |
17993
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
116 (documentation . ("Support for Chinese GB2312 character set." |
18156
f7296dc03177
(describe-chinese-environment-map):
Richard M. Stallman <rms@gnu.org>
parents:
17993
diff
changeset
|
117 . describe-chinese-environment-map)) |
17993
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
118 )) |
17052 | 119 |
120 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; | |
121 ;;; Chinese BIG5 (traditional) | |
122 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; | |
123 | |
124 (make-coding-system | |
20158
36eb3e583396
Give proper SAFE-CHARSET argument in each
Kenichi Handa <handa@m17n.org>
parents:
20109
diff
changeset
|
125 'chinese-big5 3 ?B "BIG5 8-bit encoding for Chinese (MIME:CN-BIG5)" |
36eb3e583396
Give proper SAFE-CHARSET argument in each
Kenichi Handa <handa@m17n.org>
parents:
20109
diff
changeset
|
126 nil '(chinese-big5-1 chinese-big5-2)) |
17052 | 127 |
18520
383d11185239
Swap args to define-coding-system-alias.
Richard M. Stallman <rms@gnu.org>
parents:
18377
diff
changeset
|
128 (define-coding-system-alias 'big5 'chinese-big5) |
383d11185239
Swap args to define-coding-system-alias.
Richard M. Stallman <rms@gnu.org>
parents:
18377
diff
changeset
|
129 (define-coding-system-alias 'cn-big5 'chinese-big5) |
17084
07f0a1e07d1e
Add INIT-BOL to coding system iso-2022-cn.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
130 |
17052 | 131 ;; A Big5 font requires a special encoding. |
132 (define-ccl-program ccl-encode-big5-font | |
133 `(0 | |
134 ;; In: R0:chinese-big5-1 or chinese-big5-2 | |
135 ;; R1:position code 1 | |
136 ;; R2:position code 2 | |
137 ;; Out: R1:font code point 1 | |
138 ;; R2:font code point 2 | |
139 ((r2 = ((((r1 - ?\x21) * 94) + r2) - ?\x21)) | |
140 (if (r0 == ,(charset-id 'chinese-big5-2)) (r2 += 6280)) | |
141 (r1 = ((r2 / 157) + ?\xA1)) | |
142 (r2 %= 157) | |
143 (if (r2 < ?\x3F) (r2 += ?\x40) (r2 += ?\x62)))) | |
144 "CCL program to encode a Big5 code to code point of Big5 font.") | |
145 | |
146 (setq font-ccl-encoder-alist | |
147 (cons (cons "big5" ccl-encode-big5-font) font-ccl-encoder-alist)) | |
148 | |
149 (set-language-info-alist | |
17993
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
150 "Chinese-BIG5" '((setup-function . (setup-chinese-big5-environment |
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
151 . setup-chinese-environment-map)) |
17052 | 152 (charset . (chinese-big5-1 chinese-big5-2)) |
18203
0745f30aec66
Adjusted for coding system name change.
Kenichi Handa <handa@m17n.org>
parents:
18156
diff
changeset
|
153 (coding-system . (chinese-big5 chinese-iso-7bit)) |
17765
9c4845e8101d
Make functions setup-LANGUAGE-environment
Kenichi Handa <handa@m17n.org>
parents:
17084
diff
changeset
|
154 (sample-text . "Cantonese ($(0GnM$(B,$(0N]0*Hd(B) $(0*/=((B, $(0+$)p(B") |
17993
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
155 (documentation . ("Support for Chinese Big5 character set." |
18156
f7296dc03177
(describe-chinese-environment-map):
Richard M. Stallman <rms@gnu.org>
parents:
17993
diff
changeset
|
156 . describe-chinese-environment-map)) |
17993
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
157 )) |
17052 | 158 |
159 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; | |
160 ;;; Chinese CNS11643 (traditional) | |
161 ;;;;;;;;;;;;;;;;;;;;;;;;;;;;;; | |
162 | |
163 (set-language-info-alist | |
17993
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
164 "Chinese-CNS" '((setup-function . (setup-chinese-cns-environment |
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
165 . setup-chinese-environment-map)) |
17052 | 166 (charset . (chinese-cns11643-1 chinese-cns11643-2 |
167 chinese-cns11643-3 chinese-cns11643-4 | |
168 chinese-cns11643-5 chinese-cns11643-6 | |
169 chinese-cns11643-7)) | |
18203
0745f30aec66
Adjusted for coding system name change.
Kenichi Handa <handa@m17n.org>
parents:
18156
diff
changeset
|
170 (coding-system . (chinese-iso-7bit)) |
17993
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
171 (documentation . ("Support for Chinese CNS character sets." |
18156
f7296dc03177
(describe-chinese-environment-map):
Richard M. Stallman <rms@gnu.org>
parents:
17993
diff
changeset
|
172 . describe-chinese-environment-map)) |
17993
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17841
diff
changeset
|
173 )) |
17052 | 174 |
175 ;;; chinese.el ends here |