Mercurial > emacs
annotate lisp/international/codepage.el @ 63092:80ef8a2a052d
(debug): Don't bury the buffer unless it's in a dedicated window.
| author | Stefan Monnier <monnier@iro.umontreal.ca> |
|---|---|
| date | Mon, 06 Jun 2005 19:47:05 +0000 |
| parents | c36561fe0657 |
| children | 18a818a2ee7c f042e7c0fe20 |
| rev | line source |
|---|---|
|
38412
253f761ad37b
Some fixes to follow coding conventions in files maintained by FSF.
Pavel Janík <Pavel@Janik.cz>
parents:
36579
diff
changeset
|
1 ;;; codepage.el --- MS-DOS/MS-Windows specific coding systems |
| 23915 | 2 |
| 62274 | 3 ;; Copyright (C) 1998, 1999, 2000, 2002 Free Software Foundation, Inc. |
| 4 ;; Copyright (C) 2000 | |
| 5 ;; National Institute of Advanced Industrial Science and Technology (AIST) | |
| 6 ;; Registration Number H14PRO021 | |
| 23915 | 7 |
| 8 ;; Author: Eli Zaretskii | |
| 9 ;; Maintainer: FSF | |
|
29922
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
10 ;; Keywords: i18n ms-dos ms-windows codepage |
| 23915 | 11 |
| 12 ;; This file is part of GNU Emacs. | |
| 13 | |
| 14 ;; GNU Emacs is free software; you can redistribute it and/or modify | |
| 15 ;; it under the terms of the GNU General Public License as published by | |
| 16 ;; the Free Software Foundation; either version 2, or (at your option) | |
| 17 ;; any later version. | |
| 18 | |
| 19 ;; GNU Emacs is distributed in the hope that it will be useful, | |
| 20 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of | |
| 21 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
| 22 ;; GNU General Public License for more details. | |
| 23 | |
| 24 ;; You should have received a copy of the GNU General Public License | |
| 25 ;; along with GNU Emacs; see the file COPYING. If not, write to the | |
| 26 ;; Free Software Foundation, Inc., 59 Temple Place - Suite 330, | |
| 27 ;; Boston, MA 02111-1307, USA. | |
| 28 | |
| 29 ;;; Commentary: | |
| 30 | |
|
29922
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
31 ;; Special coding systems for DOS/Windows codepage support. |
| 23915 | 32 ;; |
|
29922
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
33 ;; These coding systems perform conversion from the DOS/Windows |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
34 ;; codepage encoding to one of the ISO-8859 character sets. Each |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
35 ;; codepage has its corresponding ISO-8859 charset, chosen so as to be |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
36 ;; able to convert all (or most) of the characters. The idea is that |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
37 ;; Emacs internally works with the usual MULE charsets, and the |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
38 ;; conversion to and from the DOS codepage is performed on I/O only. |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
39 ;; See term/internal.el for the complementary setup of the DOS |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
40 ;; terminal display and input methods. |
| 23915 | 41 ;; |
| 42 ;; Thanks to Ken'ichi Handa <handa@etl.go.jp> for writing the CCL | |
|
49598
0d8b17d428b5
Trailing whitepace deleted.
Juanma Barranquero <lekktu@gmail.com>
parents:
48363
diff
changeset
|
43 ;; encoders/decoders, and for help in debugging this code. |
| 23915 | 44 |
| 45 ;;; Code: | |
| 46 | |
| 47 (defun cp-coding-system-for-codepage-1 (coding mnemonic iso-name | |
| 48 decoder encoder) | |
| 49 "Make coding system CODING for a DOS codepage using translation tables. | |
| 50 MNEMONIC is a character to be displayed on mode line for the coding system. | |
| 51 ISO-NAME is the name of the ISO-8859 charset which corresponds to this | |
| 52 codepage. | |
| 53 DECODER is a translation table for converting characters in the DOS codepage | |
| 54 encoding to Emacs multibyte characters. | |
| 55 ENCODER is a translation table for encoding Emacs multibyte characters into | |
|
29922
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
56 external DOS codepage codes." |
| 23915 | 57 (save-match-data |
| 58 (let* ((coding-name (symbol-name coding)) | |
|
24279
7334c513dc7d
(cp-coding-system-for-codepage-1): On MS-DOS,
Eli Zaretskii <eliz@gnu.org>
parents:
24088
diff
changeset
|
59 (undef (if (eq system-type 'ms-dos) |
|
7334c513dc7d
(cp-coding-system-for-codepage-1): On MS-DOS,
Eli Zaretskii <eliz@gnu.org>
parents:
24088
diff
changeset
|
60 (if dos-unsupported-char-glyph |
|
7334c513dc7d
(cp-coding-system-for-codepage-1): On MS-DOS,
Eli Zaretskii <eliz@gnu.org>
parents:
24088
diff
changeset
|
61 (logand dos-unsupported-char-glyph 255) |
|
7334c513dc7d
(cp-coding-system-for-codepage-1): On MS-DOS,
Eli Zaretskii <eliz@gnu.org>
parents:
24088
diff
changeset
|
62 127) |
|
7334c513dc7d
(cp-coding-system-for-codepage-1): On MS-DOS,
Eli Zaretskii <eliz@gnu.org>
parents:
24088
diff
changeset
|
63 ??)) |
|
30493
6ca8f913d1df
(cp-coding-system-for-codepage-1): Give `safe-chars' property to
Kenichi Handa <handa@m17n.org>
parents:
29922
diff
changeset
|
64 (safe-chars (make-char-table 'safe-chars)) |
|
29721
b722da8919f6
(cp-coding-system-for-codepage-1): Delete special codes for
Kenichi Handa <handa@m17n.org>
parents:
29258
diff
changeset
|
65 (ccl-decoder |
|
23920
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
66 (ccl-compile |
|
29721
b722da8919f6
(cp-coding-system-for-codepage-1): Delete special codes for
Kenichi Handa <handa@m17n.org>
parents:
29258
diff
changeset
|
67 ;; The 4 here supplies the buf_magnification parameter |
|
b722da8919f6
(cp-coding-system-for-codepage-1): Delete special codes for
Kenichi Handa <handa@m17n.org>
parents:
29258
diff
changeset
|
68 ;; for the CCL program. A multibyte character may take |
|
29922
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
69 ;; at most 4 bytes. |
|
23920
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
70 `(4 (loop (read r1) |
|
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
71 (if (r1 >= 128) |
|
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
72 ((r0 = ,(charset-id 'ascii)) |
|
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
73 (translate-character ,decoder r0 r1) |
|
29721
b722da8919f6
(cp-coding-system-for-codepage-1): Delete special codes for
Kenichi Handa <handa@m17n.org>
parents:
29258
diff
changeset
|
74 (write-multibyte-character r0 r1)) |
|
23920
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
75 (write r1)) |
|
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
76 (repeat))))) |
|
29721
b722da8919f6
(cp-coding-system-for-codepage-1): Delete special codes for
Kenichi Handa <handa@m17n.org>
parents:
29258
diff
changeset
|
77 (ccl-encoder |
|
23920
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
78 (ccl-compile |
|
24662
5d61c3793c06
(cp-coding-system-for-codepage-1):
Andrew Innes <andrewi@gnu.org>
parents:
24454
diff
changeset
|
79 ;; The 2 here supplies the buf_magnification parameter for |
|
5d61c3793c06
(cp-coding-system-for-codepage-1):
Andrew Innes <andrewi@gnu.org>
parents:
24454
diff
changeset
|
80 ;; the CCL program. Since the -dos coding system generates |
|
5d61c3793c06
(cp-coding-system-for-codepage-1):
Andrew Innes <andrewi@gnu.org>
parents:
24454
diff
changeset
|
81 ;; \r\n for each \n, a factor of 2 covers even the worst case |
|
5d61c3793c06
(cp-coding-system-for-codepage-1):
Andrew Innes <andrewi@gnu.org>
parents:
24454
diff
changeset
|
82 ;; of empty lines with a single \n. |
|
5d61c3793c06
(cp-coding-system-for-codepage-1):
Andrew Innes <andrewi@gnu.org>
parents:
24454
diff
changeset
|
83 `(2 (loop (read-multibyte-character r0 r1) |
|
23920
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
84 (if (r0 != ,(charset-id 'ascii)) |
|
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
85 ((translate-character ,encoder r0 r1) |
|
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
86 (if (r0 == ,(charset-id 'japanese-jisx0208)) |
|
24279
7334c513dc7d
(cp-coding-system-for-codepage-1): On MS-DOS,
Eli Zaretskii <eliz@gnu.org>
parents:
24088
diff
changeset
|
87 ((r1 = ,undef) |
|
23920
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
88 (write r1))))) |
|
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
89 (write-repeat r1)))))) |
|
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
90 |
|
30493
6ca8f913d1df
(cp-coding-system-for-codepage-1): Give `safe-chars' property to
Kenichi Handa <handa@m17n.org>
parents:
29922
diff
changeset
|
91 ;; Set elements of safe multibyte characters for this codepage |
|
6ca8f913d1df
(cp-coding-system-for-codepage-1): Give `safe-chars' property to
Kenichi Handa <handa@m17n.org>
parents:
29922
diff
changeset
|
92 ;; to t in the char-table safe-chars. |
|
6ca8f913d1df
(cp-coding-system-for-codepage-1): Give `safe-chars' property to
Kenichi Handa <handa@m17n.org>
parents:
29922
diff
changeset
|
93 (let ((tbl (get decoder 'translation-table)) |
|
6ca8f913d1df
(cp-coding-system-for-codepage-1): Give `safe-chars' property to
Kenichi Handa <handa@m17n.org>
parents:
29922
diff
changeset
|
94 (i 128) |
|
6ca8f913d1df
(cp-coding-system-for-codepage-1): Give `safe-chars' property to
Kenichi Handa <handa@m17n.org>
parents:
29922
diff
changeset
|
95 ch) |
|
6ca8f913d1df
(cp-coding-system-for-codepage-1): Give `safe-chars' property to
Kenichi Handa <handa@m17n.org>
parents:
29922
diff
changeset
|
96 (while (< i 256) |
|
6ca8f913d1df
(cp-coding-system-for-codepage-1): Give `safe-chars' property to
Kenichi Handa <handa@m17n.org>
parents:
29922
diff
changeset
|
97 (setq ch (aref tbl i)) |
|
6ca8f913d1df
(cp-coding-system-for-codepage-1): Give `safe-chars' property to
Kenichi Handa <handa@m17n.org>
parents:
29922
diff
changeset
|
98 (if ch (aset safe-chars ch t)) |
|
6ca8f913d1df
(cp-coding-system-for-codepage-1): Give `safe-chars' property to
Kenichi Handa <handa@m17n.org>
parents:
29922
diff
changeset
|
99 (setq i (1+ i)))) |
|
6ca8f913d1df
(cp-coding-system-for-codepage-1): Give `safe-chars' property to
Kenichi Handa <handa@m17n.org>
parents:
29922
diff
changeset
|
100 |
|
23920
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
101 ;; Make coding system CODING. |
| 23915 | 102 (make-coding-system |
| 103 coding 4 mnemonic | |
| 104 (concat "8-bit encoding of " (symbol-name iso-name) | |
|
23920
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
105 " characters using IBM codepage " coding-name) |
|
29721
b722da8919f6
(cp-coding-system-for-codepage-1): Delete special codes for
Kenichi Handa <handa@m17n.org>
parents:
29258
diff
changeset
|
106 (cons ccl-decoder ccl-encoder) |
|
29258
aa05ee69de27
(cp-coding-system-for-codepage-1): Add
Eli Zaretskii <eliz@gnu.org>
parents:
29189
diff
changeset
|
107 `((safe-charsets ascii eight-bit-control eight-bit-graphic ,iso-name) |
|
30493
6ca8f913d1df
(cp-coding-system-for-codepage-1): Give `safe-chars' property to
Kenichi Handa <handa@m17n.org>
parents:
29922
diff
changeset
|
108 (safe-chars . ,safe-chars) |
|
29721
b722da8919f6
(cp-coding-system-for-codepage-1): Delete special codes for
Kenichi Handa <handa@m17n.org>
parents:
29258
diff
changeset
|
109 (valid-codes (0 . 255))))))) |
| 23915 | 110 |
| 111 (defun cp-decoding-vector-for-codepage (table charset offset) | |
| 112 "Create a vector for decoding IBM PC characters using conversion table | |
| 113 TABLE into an ISO-8859 character set CHARSET whose first non-ASCII | |
| 24033 | 114 character is generated by (make-char CHARSET OFFSET)." |
| 23915 | 115 (let* ((len (length table)) |
| 116 (undefined-char | |
| 117 (if (eq system-type 'ms-dos) | |
| 118 (if dos-unsupported-char-glyph | |
| 119 (logand dos-unsupported-char-glyph 255) | |
| 120 127) | |
| 121 32)) | |
| 122 (vec1 (make-vector 256 undefined-char)) | |
| 123 (i 0)) | |
|
29189
59e5b57b10db
(cp-decoding-vector-for-codepage):
Eli Zaretskii <eliz@gnu.org>
parents:
29180
diff
changeset
|
124 (while (< i 256) |
| 23915 | 125 (aset vec1 i i) |
| 126 (setq i (1+ i))) | |
| 127 (setq i 0) | |
| 128 (while (< i len) | |
| 129 (if (aref table i) | |
| 130 (aset vec1 (aref table i) (make-char charset (+ i offset)))) | |
| 131 (setq i (1+ i))) | |
| 132 vec1)) | |
| 133 | |
| 134 ;;; You don't think I created all these tables below by hand, do you? | |
| 135 ;;; The following Awk script will create the table for cp850-to-Latin-1 | |
| 136 ;;; conversion from the RFC 1345 file (the other tables are left as an | |
| 137 ;;; exercise): | |
| 138 ;;; BEGIN { n_pages = 11; | |
| 139 ;;; pn["IBM437"] = 0; pn["IBM850"] = 1; pn["IBM851"] = 2; | |
| 140 ;;; pn["IBM852"] = 3; pn["IBM855"] = 4; pn["IBM860"] = 5; | |
| 141 ;;; pn["IBM861"] = 6; pn["IBM862"] = 7; pn["IBM863"] = 8; | |
| 142 ;;; pn["IBM864"] = 9; pn["IBM865"] = 10; | |
| 143 ;;; } | |
| 144 ;;; $1 == "&charset" { charset = $2; } | |
| 145 ;;; $1 == "&code" { code = $2; } | |
| 146 ;;; /^ [^&]/ { | |
| 147 ;;; if ((charset ~ /^IBM(437|8(5[0125]|6[0-5]))$/) || (charset ~ /^ISO_8859-1/)) | |
| 148 ;;; { | |
| 149 ;;; for (i = 1; i <= NF; i++) | |
| 150 ;;; chars[charset,code++] = $i; | |
| 151 ;;; } | |
| 152 ;;; } | |
| 153 ;;; | |
| 154 ;;; END { | |
| 155 ;;; for (i = 160; i < 256; i++) | |
| 156 ;;; { | |
| 157 ;;; c = chars["ISO_8859-1:1987",i]; | |
| 158 ;;; if (c == "??") # skip unused positions | |
| 159 ;;; { | |
| 160 ;;; printf " nil"; | |
| 161 ;;; if ((i - 159)%16 == 0) | |
| 162 ;;; printf "\n"; | |
| 163 ;;; continue; | |
| 164 ;;; } | |
| 165 ;;; found = 0; | |
| 166 ;;; for (j in pn) | |
| 167 ;;; map[j] = "nil"; | |
| 168 ;;; for (combined in chars) | |
| 169 ;;; { | |
| 170 ;;; candidate = chars[combined]; | |
| 171 ;;; split (combined, separate, SUBSEP); | |
| 172 ;;; if (separate[1] == "IBM850" && candidate == c) | |
| 173 ;;; { | |
| 174 ;;; found = 1; | |
| 175 ;;; map[separate[1]] = separate[2]; | |
| 176 ;;; } | |
| 177 ;;; } | |
| 178 ;;; printf " %s", map["IBM850"]; | |
| 179 ;;; if ((i - 159)%16 == 0) | |
| 180 ;;; printf "\n"; | |
| 181 ;;; } | |
| 182 ;;; } | |
| 183 | |
| 184 ;;; WARNING WARNING WARNING!!! | |
| 185 ;;; | |
| 186 ;;; If you want to get fancy with these tables, remember that the inverse | |
| 187 ;;; tables, created by `cp-decoding-vector-for-codepage' above, are installed | |
| 188 ;;; on MS-DOS as nonascii-translation-table (see `dos-codepage-setup' in | |
| 189 ;;; internal.el). Therefore, you should NOT put any codes below 128 in | |
| 190 ;;; these tables! Otherwise, various Emacs commands and functions will | |
| 191 ;;; mysteriously fail! For example, a typical screwup is to map the Latin-N | |
| 192 ;;; acute accent character to the apostrophe, and have all regexps which | |
| 193 ;;; end with "\\'" begin to fail (e.g., the automatic setting of the major | |
| 194 ;;; mode by file name extension will stop working). | |
| 195 ;;; | |
| 196 ;;; You HAVE BEEN warned! | |
| 197 | |
| 198 ;; US/English/PC-8/IBM-2. This doesn't support Latin-1 characters very | |
| 199 ;; well, but why not use what we can salvage? | |
| 200 (defvar cp437-decode-table | |
| 201 ;; Nth element is the code of a cp437 glyph for the multibyte | |
| 202 ;; character created by (make-char 'latin-iso8859-1 (+ N 160)). | |
|
24064
e4cc744bdce5
(cp850-decode-table): Replace nil
Eli Zaretskii <eliz@gnu.org>
parents:
24033
diff
changeset
|
203 ;; The element nil means there's no corresponding cp437 glyph. |
| 23915 | 204 [ |
| 205 255 173 155 156 nil 157 179 nil nil nil 166 174 170 196 nil nil | |
| 206 248 241 253 nil nil nil nil 249 nil nil 167 175 172 171 nil 168 | |
| 207 nil nil nil nil 142 143 146 128 nil 144 nil nil nil nil nil nil | |
| 208 nil 165 nil nil nil nil 153 nil nil nil nil nil 154 nil nil 225 | |
| 209 133 160 131 nil 132 134 145 135 138 130 136 137 141 161 140 139 | |
| 210 nil 164 149 162 147 nil 148 246 nil 151 163 150 129 nil nil 152] | |
| 211 "Table for converting ISO-8859-1 characters into codepage 437 glyphs.") | |
| 212 (setplist 'cp437-decode-table | |
| 213 '(charset latin-iso8859-1 language "Latin-1" offset 160)) | |
| 214 | |
| 215 ;; Multilingual (Latin-1) | |
| 216 (defvar cp850-decode-table | |
| 217 ;; Nth element is the code of a cp850 glyph for the multibyte | |
| 218 ;; character created by (make-char 'latin-iso8859-1 (+ N 160)). | |
| 219 ;; The element nil means there's no corresponding cp850 glyph. | |
| 220 [ | |
|
24072
749d25833f30
(cp850-decode-table): Fix previous change.
Eli Zaretskii <eliz@gnu.org>
parents:
24064
diff
changeset
|
221 255 173 189 156 207 190 221 245 249 184 166 174 170 240 169 nil |
|
24085
8dc3b068c0db
(cp855-decode-table, cp850-decode-table): Fill some nil entries.
Eli Zaretskii <eliz@gnu.org>
parents:
24072
diff
changeset
|
222 248 241 253 252 239 230 244 250 247 251 167 175 172 171 243 168 |
| 23915 | 223 183 181 182 199 142 143 146 128 212 144 210 211 222 214 215 216 |
| 224 209 165 227 224 226 229 153 158 157 235 233 234 154 237 231 225 | |
| 225 133 160 131 198 132 134 145 135 138 130 136 137 141 161 140 139 | |
| 226 208 164 149 162 147 228 148 246 155 151 163 150 129 236 232 152] | |
| 227 "Table for converting ISO-8859-1 characters into codepage 850 glyphs.") | |
| 228 (setplist 'cp850-decode-table | |
| 229 '(charset latin-iso8859-1 language "Latin-1" offset 160)) | |
| 230 | |
| 231 ;; Greek | |
| 232 (defvar cp851-decode-table | |
| 233 [ | |
| 234 255 nil nil 156 nil nil nil 245 249 nil nil 174 nil 240 nil nil | |
| 235 248 241 nil nil 239 nil 134 nil 141 143 144 175 146 171 149 152 | |
| 236 161 164 165 166 167 168 169 170 172 173 181 182 184 183 189 190 | |
| 237 198 199 nil 207 208 209 210 211 212 213 nil nil 155 157 158 159 | |
| 238 252 214 215 216 221 222 224 225 226 227 228 229 230 231 232 233 | |
| 239 234 235 237 236 238 242 243 244 246 250 160 251 162 163 253 nil] | |
| 240 "Table for converting ISO-8859-7 characters into codepage 851 glyphs.") | |
| 241 (setplist 'cp851-decode-table | |
| 242 '(charset greek-iso8859-7 language "Greek" offset 160)) | |
| 243 | |
| 244 ;; Slavic/Eastern Europe (Latin-2) | |
| 245 (defvar cp852-decode-table | |
| 246 [ | |
| 247 255 164 244 157 207 149 151 245 249 230 184 155 141 240 166 189 | |
| 248 248 165 247 136 239 150 152 243 242 231 173 156 171 241 167 190 | |
|
24088
bb95d3d24ff9
(cp852-decode-table): Fill a nil entry.
Eli Zaretskii <eliz@gnu.org>
parents:
24085
diff
changeset
|
249 232 181 182 198 142 145 143 128 172 144 168 211 183 214 215 210 |
| 23915 | 250 209 227 213 224 226 138 153 158 252 222 233 235 154 237 221 225 |
| 251 234 160 131 199 132 146 134 135 159 130 169 137 216 161 140 212 | |
| 252 208 228 229 162 147 139 148 246 253 133 163 251 129 236 238 250] | |
| 253 "Table for converting ISO-8859-2 characters into codepage 852 glyphs.") | |
| 254 (setplist 'cp852-decode-table | |
| 255 '(charset latin-iso8859-2 language "Latin-2" offset 160)) | |
| 256 | |
| 257 ;; Russian | |
| 258 (defvar cp855-decode-table | |
| 259 [ | |
|
24085
8dc3b068c0db
(cp855-decode-table, cp850-decode-table): Fill some nil entries.
Eli Zaretskii <eliz@gnu.org>
parents:
24072
diff
changeset
|
260 255 133 129 131 135 137 139 141 143 145 147 149 151 240 153 155 |
| 23915 | 261 161 163 236 173 167 169 234 244 184 190 199 209 211 213 215 221 |
| 262 226 228 230 232 171 182 165 252 246 250 159 242 238 248 157 224 | |
| 263 160 162 235 172 166 168 233 243 183 189 198 208 210 212 214 216 | |
| 264 225 227 229 231 170 181 164 251 245 249 158 241 237 247 156 222 | |
|
24085
8dc3b068c0db
(cp855-decode-table, cp850-decode-table): Fill some nil entries.
Eli Zaretskii <eliz@gnu.org>
parents:
24072
diff
changeset
|
265 239 132 128 130 134 136 138 140 142 144 146 148 150 253 152 154] |
| 23915 | 266 "Table for converting ISO-8859-5 characters into codepage 855 glyphs.") |
| 267 (setplist 'cp855-decode-table | |
| 268 '(charset cyrillic-iso8859-5 language "Cyrillic-ISO" offset 160)) | |
| 269 | |
| 270 ;; Turkish | |
| 271 (defvar cp857-decode-table | |
| 272 [ | |
| 273 255 nil nil 156 207 nil 245 249 152 158 166 nil 240 nil | |
| 274 248 nil 253 252 239 nil nil nil nil 141 159 167 nil 171 nil | |
| 275 183 181 182 142 nil nil 128 212 144 210 211 222 214 215 216 | |
| 276 165 227 224 226 nil 153 232 nil 235 233 234 154 nil nil 225 | |
| 277 133 160 131 132 nil nil 135 138 130 136 137 236 161 140 139 | |
| 278 164 149 162 147 nil 148 246 nil 151 163 150 129 nil nil 250] | |
| 279 "Table for converting ISO-8859-3 characters into codepage 857 glyphs.") | |
| 280 (setplist 'cp857-decode-table | |
| 281 '(charset latin-iso8859-3 language "Latin-3" offset 160)) | |
| 282 | |
| 283 ;; Portuguese | |
| 284 (defvar cp860-decode-table | |
| 285 [ | |
| 286 255 173 155 156 nil nil 179 nil nil nil 166 174 170 nil nil nil | |
| 287 nil 241 253 nil nil nil nil 249 nil nil 167 175 172 171 nil 168 | |
| 288 145 134 143 142 nil nil nil 128 146 144 137 nil 152 nil 139 nil | |
| 289 nil 165 159 169 140 153 nil nil nil 157 150 nil 154 nil nil nil | |
| 290 133 160 131 132 nil nil nil 135 138 130 136 nil 141 161 nil nil | |
| 291 nil 164 149 162 147 148 nil 246 nil 151 163 nil 129 nil nil nil] | |
| 292 "Table for converting ISO-8859-1 characters into codepage 860 glyphs.") | |
| 293 (setplist 'cp860-decode-table | |
| 294 '(charset latin-iso8859-1 language "Latin-1" offset 160)) | |
| 295 | |
| 296 ;; Icelandic | |
| 297 (defvar cp861-decode-table | |
| 298 [ | |
| 299 255 173 nil 156 nil nil nil nil nil nil nil 174 170 nil nil nil | |
| 300 nil 241 253 nil nil nil nil 249 nil nil nil 175 172 171 nil 168 | |
| 301 nil 164 nil nil 142 143 146 128 nil 144 nil nil nil 165 nil nil | |
| 302 139 nil 159 166 nil nil 153 nil 157 nil 167 nil 154 151 141 nil | |
| 303 133 160 131 nil 132 134 145 135 138 130 136 137 nil 161 nil nil | |
| 304 140 nil nil 162 147 nil 148 246 155 nil 163 150 129 152 149 nil] | |
| 305 "Table for converting ISO-8859-1 characters into codepage 861 glyphs.") | |
| 306 (setplist 'cp861-decode-table | |
| 307 '(charset latin-iso8859-1 language "Latin-1" offset 160)) | |
| 308 | |
| 309 ;; Hebrew | |
| 310 (defvar cp862-decode-table | |
| 311 ;; Nth element is the code of a cp862 glyph for the multibyte | |
| 312 ;; character created by (make-char 'hebrew-iso8859-8 (+ N 160)). | |
|
29922
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
313 ;; The element nil means there's no corresponding cp862 glyph. |
| 23915 | 314 [ |
| 315 255 173 155 156 nil 157 179 nil nil nil nil 174 170 196 nil nil | |
| 316 248 241 253 nil nil 230 nil 249 nil nil 246 175 172 171 nil nil | |
| 317 nil nil nil nil nil nil nil nil nil nil nil nil nil nil nil nil | |
| 318 nil nil nil nil nil nil nil nil nil nil nil nil nil nil nil 205 | |
| 319 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 | |
| 320 144 145 146 147 148 149 150 151 152 153 154 nil nil nil nil nil] | |
| 321 "Table for converting ISO-8859-8 characters into codepage 862 glyphs.") | |
| 322 (setplist 'cp862-decode-table | |
| 323 '(charset hebrew-iso8859-8 language "Hebrew" offset 160)) | |
| 324 | |
| 325 ;; French Canadian | |
| 326 (defvar cp863-decode-table | |
| 327 [ | |
| 328 255 nil 155 156 152 nil 160 143 164 nil nil 174 170 nil nil 167 | |
| 329 nil 241 253 166 161 nil 134 249 165 nil nil 175 172 171 173 nil | |
| 330 142 nil 132 nil nil nil nil 128 145 144 146 148 nil nil 168 149 | |
| 331 nil nil nil nil 153 nil nil nil nil 157 nil 158 154 nil nil nil | |
| 332 133 nil 131 nil nil nil nil 135 138 130 136 137 141 nil 140 139 | |
| 333 nil nil nil 162 147 nil nil 246 nil 151 163 150 129 nil nil nil] | |
| 334 "Table for converting ISO-8859-1 characters into codepage 863 glyphs.") | |
| 335 (setplist 'cp863-decode-table | |
| 336 '(charset latin-iso8859-1 language "Latin-1" offset 160)) | |
| 337 | |
| 338 ;; Arabic | |
| 339 ;; FIXME: Emacs doesn't seem to support the "Arabic" language | |
| 340 ;; environment yet. So this is only partially usable, for now. | |
| 341 (defvar cp864-decode-table | |
| 342 [ | |
| 343 255 nil nil nil 164 nil nil nil nil nil nil nil 172 161 nil nil | |
| 344 nil nil nil nil nil nil nil nil nil nil nil 187 nil nil nil 191 | |
| 345 nil 193 194 195 196 nil 198 199 169 201 170 171 173 174 175 207 | |
| 346 208 209 210 188 189 190 235 215 216 223 238 nil nil nil nil nil | |
| 347 224 247 248 252 251 239 242 243 232 233 253 nil nil nil nil nil | |
| 348 nil 241 nil nil nil nil nil nil nil nil nil nil nil nil nil nil] | |
|
29922
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
349 "Table for converting ISO-8859-6 characters into codepage 864 glyphs.") |
| 23915 | 350 (setplist 'cp864-decode-table |
| 351 '(charset arabic-iso8859-6 language nil offset 160)) | |
| 352 | |
|
29922
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
353 ;; Arabic OEM codepage used by Windows |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
354 ;; FIXME: Emacs doesn't seem to support the "Arabic" language |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
355 ;; environment yet. So this is only partially usable, for now. |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
356 (defvar cp720-decode-table |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
357 [ |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
358 255 nil nil nil 148 nil nil nil nil nil nil nil nil 196 nil nil |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
359 nil nil nil nil nil nil nil nil nil nil nil nil nil nil nil nil |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
360 nil 152 153 154 155 157 158 159 160 161 162 163 164 165 166 167 |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
361 168 169 170 171 172 173 224 225 226 227 228 nil nil nil nil nil |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
362 149 229 231 232 233 234 235 236 237 238 239 241 242 243 244 245 |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
363 246 145 146 nil nil nil nil nil nil nil nil nil nil nil nil nil] |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
364 "Table for converting ISO-8859-6 characters into codepage 720 glyphs.") |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
365 (setplist 'cp720-decode-table |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
366 '(charset arabic-iso8859-6 language nil offset 160)) |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
367 |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
368 |
| 23915 | 369 ;; Nordic (Norwegian/Danish) |
| 370 (defvar cp865-decode-table | |
| 371 [ | |
| 372 255 173 nil 156 nil nil nil nil nil nil 166 174 170 nil nil nil | |
| 373 nil 241 253 nil nil nil nil 249 nil nil 167 175 172 171 nil 168 | |
| 374 nil nil nil nil 142 143 146 128 nil 144 nil nil nil nil nil nil | |
| 375 nil 165 nil nil nil nil 153 nil 157 nil nil nil 154 nil nil nil | |
| 376 133 160 131 nil 132 134 145 135 138 130 136 137 141 161 140 139 | |
| 377 nil 164 149 162 147 nil 148 246 155 151 163 150 129 nil nil 152] | |
| 378 "Table for converting ISO-8859-1 characters into codepage 865 glyphs.") | |
| 379 (setplist 'cp865-decode-table | |
| 380 '(charset latin-iso8859-1 language "Latin-1" offset 160)) | |
| 381 | |
|
34672
8f55d03259de
(cp866-decode-table): New table.
Eli Zaretskii <eliz@gnu.org>
parents:
30493
diff
changeset
|
382 ;; Russian (Yes, another one! This one's supposed to be used |
|
8f55d03259de
(cp866-decode-table): New table.
Eli Zaretskii <eliz@gnu.org>
parents:
30493
diff
changeset
|
383 ;; on Windows as the Russian OEM code page.) |
|
8f55d03259de
(cp866-decode-table): New table.
Eli Zaretskii <eliz@gnu.org>
parents:
30493
diff
changeset
|
384 (defvar cp866-decode-table |
|
8f55d03259de
(cp866-decode-table): New table.
Eli Zaretskii <eliz@gnu.org>
parents:
30493
diff
changeset
|
385 [ |
|
8f55d03259de
(cp866-decode-table): New table.
Eli Zaretskii <eliz@gnu.org>
parents:
30493
diff
changeset
|
386 255 240 nil nil 242 nil nil 244 nil nil nil nil nil nil 246 nil |
|
8f55d03259de
(cp866-decode-table): New table.
Eli Zaretskii <eliz@gnu.org>
parents:
30493
diff
changeset
|
387 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 |
|
8f55d03259de
(cp866-decode-table): New table.
Eli Zaretskii <eliz@gnu.org>
parents:
30493
diff
changeset
|
388 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 |
|
8f55d03259de
(cp866-decode-table): New table.
Eli Zaretskii <eliz@gnu.org>
parents:
30493
diff
changeset
|
389 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 |
|
48363
ddfd9a0290fb
(cp866-decode-table): Fix the translation table.
Eli Zaretskii <eliz@gnu.org>
parents:
43956
diff
changeset
|
390 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 |
|
34672
8f55d03259de
(cp866-decode-table): New table.
Eli Zaretskii <eliz@gnu.org>
parents:
30493
diff
changeset
|
391 252 241 nil nil 243 nil nil 245 nil nil nil nil nil nil 247 nil] |
|
8f55d03259de
(cp866-decode-table): New table.
Eli Zaretskii <eliz@gnu.org>
parents:
30493
diff
changeset
|
392 "Table for converting ISO-8859-5 characters into codepage 866 glyphs.") |
|
8f55d03259de
(cp866-decode-table): New table.
Eli Zaretskii <eliz@gnu.org>
parents:
30493
diff
changeset
|
393 (setplist 'cp866-decode-table |
|
8f55d03259de
(cp866-decode-table): New table.
Eli Zaretskii <eliz@gnu.org>
parents:
30493
diff
changeset
|
394 '(charset cyrillic-iso8859-5 language "Cyrillic-ISO" offset 160)) |
|
8f55d03259de
(cp866-decode-table): New table.
Eli Zaretskii <eliz@gnu.org>
parents:
30493
diff
changeset
|
395 |
| 23915 | 396 ;; Greek (yes, another one!) |
| 397 (defvar cp869-decode-table | |
| 398 [ | |
| 399 255 139 140 156 nil nil 138 245 249 151 nil 174 137 240 nil 142 | |
| 400 248 241 153 154 239 247 134 136 141 143 144 175 146 171 149 152 | |
| 401 161 164 165 166 167 168 169 170 172 173 181 182 183 184 189 190 | |
| 402 198 199 nil 207 208 209 210 211 212 213 145 150 155 157 158 159 | |
| 403 252 214 215 216 221 222 224 225 226 227 228 229 230 231 232 233 | |
| 404 234 235 237 236 238 242 243 244 246 250 160 251 162 163 253 nil] | |
| 405 "Table for converting ISO-8859-7 characters into codepage 869 glyphs.") | |
| 406 (setplist 'cp869-decode-table | |
| 407 '(charset greek-iso8859-7 language "Greek" offset 160)) | |
| 408 | |
|
29922
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
409 ;; Greek OEM codepage used by Windows |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
410 (defvar cp737-decode-table |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
411 [ |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
412 255 nil nil nil nil nil 179 nil nil nil nil nil nil 196 nil nil |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
413 248 241 253 nil nil nil 234 250 235 236 237 nil 238 nil 239 240 |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
414 nil 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
415 143 144 nil 145 146 147 148 149 150 151 244 245 225 226 227 229 |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
416 nil 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
417 167 168 170 169 171 172 173 174 175 224 228 232 230 231 233 nil] |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
418 "Table for converting ISO-8859-7 characters into codepage 737 glyphs.") |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
419 (setplist 'cp737-decode-table |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
420 '(charset greek-iso8859-7 language "Greek" offset 160)) |
|
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
421 |
| 36579 | 422 ;; Conversion from codepages 770-775 to Latin-4 for Baltic countries. |
| 423 ;; FIXME: Once we support Latin-7, these should be remapped into it. | |
| 424 (defvar cp770-decode-table | |
| 425 [ | |
| 426 255 143 nil nil 155 nil 156 nil 157 159 137 168 nil 196 146 nil | |
| 427 248 133 nil nil nil nil 134 nil nil 158 136 152 nil nil 145 nil | |
| 428 160 nil nil nil 142 nil nil 173 128 nil 139 nil 144 nil nil 161 | |
| 429 nil nil nil 163 nil 149 153 nil nil 167 nil nil 154 nil 166 225 | |
| 430 131 nil nil nil 132 nil nil 141 135 nil 138 nil 130 nil nil 140 | |
| 431 nil nil nil 162 nil 147 148 247 nil 151 nil nil 129 nil 150 nil] | |
| 432 "Table for converting ISO-8859-4 characters into codepage 770 glyphs.") | |
| 433 (setplist 'cp770-decode-table | |
| 434 '(charset latin-iso8859-4 language "Latin-4" offset 160)) | |
| 435 | |
| 436 (defvar cp773-decode-table | |
| 437 [ | |
| 438 255 220 nil 138 150 nil 234 190 166 246 237 149 173 196 252 nil | |
| 439 208 nil nil 139 239 nil 235 nil nil 247 137 133 136 nil 253 nil | |
| 440 160 nil nil nil 142 143 146 244 222 144 240 nil 242 nil nil 161 | |
| 441 nil 238 226 232 nil 229 153 158 157 248 nil nil 154 nil 250 225 | |
| 442 131 nil nil nil 132 134 145 245 223 130 241 nil 243 nil nil 140 | |
| 443 nil 236 147 233 nil 228 148 198 155 249 nil nil 129 nil 251 nil] | |
| 444 "Table for converting ISO-8859-4 characters into codepage 773 glyphs.") | |
| 445 (setplist 'cp773-decode-table | |
| 446 '(charset latin-iso8859-4 language "Latin-4" offset 160)) | |
| 447 | |
| 448 (defvar cp774-decode-table | |
| 449 [ | |
| 450 255 181 nil nil 155 nil nil nil 245 190 nil nil nil 196 207 nil | |
| 451 248 208 nil nil nil nil nil nil nil 213 nil nil nil nil 216 nil | |
| 452 nil nil nil nil 142 143 146 189 182 144 183 nil 184 nil nil nil | |
| 453 nil nil nil nil nil nil 153 nil nil 198 nil nil 154 nil 199 225 | |
| 454 nil 160 nil nil 132 134 145 212 209 130 210 137 211 161 140 nil | |
| 455 nil nil nil nil 147 nil 148 246 237 214 163 150 129 nil 215 248] | |
| 456 "Table for converting ISO-8859-4 characters into codepage 774 glyphs.") | |
| 457 (setplist 'cp774-decode-table | |
| 458 '(charset latin-iso8859-4 language "Latin-4" offset 160)) | |
| 459 | |
| 23915 | 460 (defvar cp775-decode-table |
| 461 [ | |
| 462 255 181 nil 138 150 nil 234 245 166 190 237 149 173 240 207 nil | |
| 36579 | 463 248 208 nil 139 239 nil 235 nil nil 213 137 133 136 nil 216 nil |
| 23915 | 464 160 nil nil nil 142 143 146 189 182 144 183 nil 184 nil nil 161 |
| 465 nil 238 226 232 nil 229 153 158 157 198 nil nil 154 nil 199 225 | |
| 466 131 nil nil nil 132 134 145 212 209 130 210 nil 211 nil nil 140 | |
| 36579 | 467 nil 236 147 233 nil 228 148 247 155 214 nil nil 129 nil 215 nil] |
| 23915 | 468 "Table for converting ISO-8859-4 characters into codepage 775 glyphs.") |
| 469 (setplist 'cp775-decode-table | |
| 470 '(charset latin-iso8859-4 language "Latin-4" offset 160)) | |
| 471 | |
|
24454
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
472 ;; Support for the Windows 12xx series of codepages that MS has |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
473 ;; butchered from the ISO-8859 specs. This does not add support for |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
474 ;; the extended characters that MS has added in the 128 - 159 coding |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
475 ;; range; it only translates those characters that can be expressed in |
|
29922
9473e3466947
(cp-coding-system-for-codepage-1): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
29721
diff
changeset
|
476 ;; the corresponding iso-8859 charset. |
|
24454
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
477 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
478 ;; Codepage Mapping: |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
479 ;; |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
480 ;; Windows-1250: ISO-8859-2 (Central Europe) - differs in some positions |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
481 ;; Windows-1251: ISO-8859-5 (Cyrillic) - differs wildly |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
482 ;; Windows-1252: ISO-8859-1 (West Europe) - exact match |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
483 ;; Windows-1253: ISO-8859-7 (Greek) - differs in some positions |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
484 ;; Windows-1254: ISO-8859-9 (Turkish) - exact match |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
485 ;; Windows-1255: ISO-8859-8 (Hebrew) - exact match |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
486 ;; Windows-1256: ISO-8859-6 (Arabic) - half match |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
487 ;; Windows-1257: ISO-8859-4 (Baltic) - differs, future Latin-7 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
488 ;; Windows-1258: VISCII (Vietnamese) - Completely different |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
489 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
490 (defvar cp1250-decode-table |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
491 [ |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
492 160 165 162 163 164 188 140 167 168 138 170 141 143 173 142 175 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
493 176 185 178 179 180 190 156 161 184 154 186 157 159 189 158 191 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
494 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
495 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
496 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
497 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 ] |
| 41946 | 498 "ISO-8859-2 to Windows-1250 (Central Europe) codepage decoding table.") |
|
24454
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
499 (setplist 'cp1250-decode-table |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
500 '(charset latin-iso8859-2 language "Latin-2" offset 160)) |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
501 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
502 (defvar cp1251-decode-table |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
503 [ |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
504 160 168 128 129 170 189 178 175 163 138 140 142 141 173 161 143 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
505 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
506 208 209 210 211 212 213 214 215 216 217 218 219 220 221 222 223 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
507 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
508 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 255 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
509 185 184 144 131 186 190 179 191 188 154 156 158 157 167 162 159 ] |
| 41946 | 510 "ISO-8859-5 to Windows-1251 (Cyrillic) codepage decoding table.") |
|
24454
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
511 (setplist 'cp1251-decode-table |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
512 '(charset cyrillic-iso8859-5 language "Cyrillic-ISO" offset 160)) |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
513 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
514 ;; cp1253 is missing nbsp so we cannot quite translate perfectly. It |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
515 ;; also has two micro/mu characters which would require more complex |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
516 ;; processing to accommodate. |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
517 (defvar cp1253-decode-table |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
518 [ |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
519 nil 145 146 163 nil nil 166 167 168 169 nil 171 172 173 nil 151 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
520 176 177 178 179 180 161 162 183 184 185 186 187 188 189 190 191 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
521 192 193 194 195 196 197 198 199 200 201 202 203 204 205 206 207 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
522 208 209 nil 211 212 213 214 215 216 217 218 219 220 221 222 223 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
523 224 225 226 227 228 229 230 231 232 233 234 235 236 237 238 239 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
524 240 241 242 243 244 245 246 247 248 249 250 251 252 253 254 nil ] |
| 41946 | 525 "ISO-8859-7 to Windows-1253 (Greek) codepage decoding table.") |
|
24454
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
526 (setplist 'cp1253-decode-table |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
527 '(charset greek-iso8859-7 language "Greek" offset 160)) |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
528 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
529 ;; Since Latin-7 is not yet official, and Emacs does not support it, |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
530 ;; provide translation between Windows-1257 and Latin-4 the best we |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
531 ;; can. |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
532 (defvar cp1257-decode-table |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
533 [ |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
534 160 192 nil 170 164 nil 207 167 nil 208 199 204 nil 173 222 nil |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
535 176 224 nil 186 nil nil 239 nil nil 240 231 236 nil nil 254 nil |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
536 194 nil nil nil 196 197 175 193 200 201 198 nil 203 nil nil 206 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
537 nil 210 212 205 nil 213 214 215 168 216 nil nil 220 nil 219 223 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
538 226 nil nil nil 228 229 191 225 232 233 230 nil 235 nil nil 238 |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
539 nil 242 244 237 nil 245 246 247 184 248 nil nil 252 nil 251 nil ] |
| 41946 | 540 "ISO-8859-4 to Windows-1257 (Baltic) codepage decoding table.") |
|
24454
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
541 (setplist 'cp1257-decode-table |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
542 '(charset latin-iso8859-4 language "Latin-4" offset 160)) |
|
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
543 |
| 23915 | 544 ;;;###autoload |
| 545 (defun cp-make-coding-systems-for-codepage (codepage iso-name offset) | |
|
23952
4ef8ec98dd43
(cp-make-coding-systems-for-codepage): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
23920
diff
changeset
|
546 "Create a coding system to convert IBM CODEPAGE into charset ISO-NAME |
| 23915 | 547 whose first character is at offset OFFSET from the beginning of 8-bit |
| 548 ASCII table. | |
| 549 | |
|
23952
4ef8ec98dd43
(cp-make-coding-systems-for-codepage): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
23920
diff
changeset
|
550 The created coding system has the usual 3 subsidiary systems: for Unix-, |
|
4ef8ec98dd43
(cp-make-coding-systems-for-codepage): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
23920
diff
changeset
|
551 DOS- and Mac-style EOL conversion. However, unlike built-in coding |
|
4ef8ec98dd43
(cp-make-coding-systems-for-codepage): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
23920
diff
changeset
|
552 systems, the Mac-style EOL conversion is currently not supported by the |
|
4ef8ec98dd43
(cp-make-coding-systems-for-codepage): Doc fix.
Eli Zaretskii <eliz@gnu.org>
parents:
23920
diff
changeset
|
553 decoder and encoder created by this function." |
| 23915 | 554 (let* ((decode-table (intern (format "%s-decode-table" codepage))) |
| 555 (nonascii-table | |
| 556 (intern (format "%s-nonascii-translation-table" codepage))) | |
| 557 (decode-translation | |
| 558 (intern (format "%s-decode-translation-table" codepage))) | |
| 559 (encode-translation | |
|
23920
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
560 (intern (format "%s-encode-translation-table" codepage)))) |
| 23915 | 561 (set nonascii-table |
| 562 (make-translation-table-from-vector | |
| 563 (cp-decoding-vector-for-codepage | |
| 564 (symbol-value decode-table) iso-name offset))) | |
| 565 (define-translation-table encode-translation | |
| 566 (char-table-extra-slot (symbol-value nonascii-table) 0)) | |
|
29180
e2cb024e88cd
(cp-make-coding-systems-for-codepage):
Eli Zaretskii <eliz@gnu.org>
parents:
24662
diff
changeset
|
567 ;; For charsets other than ascii, eight-bit-* and ISO-NAME, set |
|
e2cb024e88cd
(cp-make-coding-systems-for-codepage):
Eli Zaretskii <eliz@gnu.org>
parents:
24662
diff
changeset
|
568 ;; `?' for one-column charsets, and some Japanese character for |
| 23915 | 569 ;; wide-column charsets. The CCL encoder converts that Japanese |
|
24279
7334c513dc7d
(cp-coding-system-for-codepage-1): On MS-DOS,
Eli Zaretskii <eliz@gnu.org>
parents:
24088
diff
changeset
|
570 ;; character to either dos-unsupported-char-glyph or "??". |
| 23915 | 571 (let ((tbl (char-table-extra-slot (symbol-value nonascii-table) 0)) |
|
24279
7334c513dc7d
(cp-coding-system-for-codepage-1): On MS-DOS,
Eli Zaretskii <eliz@gnu.org>
parents:
24088
diff
changeset
|
572 (undef (if (eq system-type 'ms-dos) |
|
7334c513dc7d
(cp-coding-system-for-codepage-1): On MS-DOS,
Eli Zaretskii <eliz@gnu.org>
parents:
24088
diff
changeset
|
573 (if dos-unsupported-char-glyph |
|
7334c513dc7d
(cp-coding-system-for-codepage-1): On MS-DOS,
Eli Zaretskii <eliz@gnu.org>
parents:
24088
diff
changeset
|
574 (logand dos-unsupported-char-glyph 255) |
|
7334c513dc7d
(cp-coding-system-for-codepage-1): On MS-DOS,
Eli Zaretskii <eliz@gnu.org>
parents:
24088
diff
changeset
|
575 127) |
|
7334c513dc7d
(cp-coding-system-for-codepage-1): On MS-DOS,
Eli Zaretskii <eliz@gnu.org>
parents:
24088
diff
changeset
|
576 ??)) |
|
29180
e2cb024e88cd
(cp-make-coding-systems-for-codepage):
Eli Zaretskii <eliz@gnu.org>
parents:
24662
diff
changeset
|
577 (charsets (delq 'ascii |
|
e2cb024e88cd
(cp-make-coding-systems-for-codepage):
Eli Zaretskii <eliz@gnu.org>
parents:
24662
diff
changeset
|
578 (delq 'eight-bit-control |
|
e2cb024e88cd
(cp-make-coding-systems-for-codepage):
Eli Zaretskii <eliz@gnu.org>
parents:
24662
diff
changeset
|
579 (delq 'eight-bit-graphic |
|
e2cb024e88cd
(cp-make-coding-systems-for-codepage):
Eli Zaretskii <eliz@gnu.org>
parents:
24662
diff
changeset
|
580 (delq iso-name |
|
e2cb024e88cd
(cp-make-coding-systems-for-codepage):
Eli Zaretskii <eliz@gnu.org>
parents:
24662
diff
changeset
|
581 (copy-sequence charset-list)))))) |
| 23915 | 582 (wide-column-char (make-char 'japanese-jisx0208 32 32))) |
| 583 (while charsets | |
| 584 (aset tbl (make-char (car charsets)) | |
|
24279
7334c513dc7d
(cp-coding-system-for-codepage-1): On MS-DOS,
Eli Zaretskii <eliz@gnu.org>
parents:
24088
diff
changeset
|
585 (if (= (charset-width (car charsets)) 1) undef wide-column-char)) |
| 23915 | 586 (setq charsets (cdr charsets)))) |
| 587 (define-translation-table decode-translation | |
| 588 (symbol-value nonascii-table)) | |
| 589 (cp-coding-system-for-codepage-1 | |
|
23920
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
590 (intern codepage) ?D iso-name decode-translation encode-translation) |
|
efcf2fcda617
(cp-coding-system-for-codepage-1):
Eli Zaretskii <eliz@gnu.org>
parents:
23915
diff
changeset
|
591 )) |
| 23915 | 592 |
| 593 (defun cp-codepage-decoder (codepage) | |
|
41989
fd3c70d7a093
Follow doc-string conventions.
Pavel Janík <Pavel@Janik.cz>
parents:
41946
diff
changeset
|
594 "If CODEPAGE is the name of a supported codepage, return its decode table. |
|
fd3c70d7a093
Follow doc-string conventions.
Pavel Janík <Pavel@Janik.cz>
parents:
41946
diff
changeset
|
595 Otherwise return nil." |
| 23915 | 596 (let ((cp (if (symbolp codepage) (symbol-name codepage) codepage))) |
| 597 (cond | |
| 598 ((stringp cp) | |
| 599 (intern-soft (format "%s-decode-table" cp))) | |
| 600 (t nil)))) | |
| 601 | |
| 602 ;;;###autoload | |
| 603 (defun cp-charset-for-codepage (codepage) | |
| 604 "Return the charset for which there is a translation table to DOS CODEPAGE. | |
| 605 CODEPAGE must be the name of a DOS codepage, a string." | |
| 606 (let ((cp-decoder (cp-codepage-decoder codepage))) | |
| 607 (if (null cp-decoder) | |
| 608 (error "Unsupported codepage %s" codepage) | |
| 609 (get cp-decoder 'charset)))) | |
| 610 | |
| 611 ;;;###autoload | |
| 612 (defun cp-language-for-codepage (codepage) | |
| 613 "Return the name of the MULE language environment for CODEPAGE. | |
| 614 CODEPAGE must be the name of a DOS codepage, a string." | |
| 615 (let ((cp-decoder (cp-codepage-decoder codepage))) | |
| 616 (if (null cp-decoder) | |
| 617 (error "Unsupported codepage %s" codepage) | |
| 618 (get cp-decoder 'language)))) | |
| 619 | |
| 620 ;;;###autoload | |
| 621 (defun cp-offset-for-codepage (codepage) | |
| 622 "Return the offset to be used in setting up coding systems for CODEPAGE. | |
| 623 CODEPAGE must be the name of a DOS codepage, a string." | |
| 624 (let ((cp-decoder (cp-codepage-decoder codepage))) | |
| 625 (if (null cp-decoder) | |
| 626 (error "Unsupported codepage %s" codepage) | |
| 627 (get cp-decoder 'offset)))) | |
| 628 | |
| 629 ;;;###autoload | |
| 630 (defun cp-supported-codepages () | |
| 631 "Return an alist of supported codepages. | |
| 632 | |
| 633 Each association in the alist has the form (NNN . CHARSET), where NNN is the | |
| 634 codepage number, and CHARSET is the MULE charset which is the closest match | |
| 635 for the character set supported by that codepage. | |
| 636 | |
| 637 A codepage NNN is supported if a variable called `cpNNN-decode-table' exists, | |
| 638 is a vector, and has a charset property." | |
| 639 (save-match-data | |
| 640 (let (alist chset sname) | |
| 641 (mapatoms | |
| 642 (function | |
| 643 (lambda (sym) | |
| 644 (if (and (boundp sym) | |
|
24454
fe0089dd2d2f
(cp1250-decode-table, cp1251-decode-table, cp1253-decode-table,
Eli Zaretskii <eliz@gnu.org>
parents:
24371
diff
changeset
|
645 (string-match "\\`cp\\([1-9][0-9][0-9][0-9]?\\)-decode-table\\'" |
| 23915 | 646 (setq sname (symbol-name sym))) |
| 647 (vectorp (symbol-value sym)) | |
| 648 (setq chset (get sym 'charset))) | |
| 649 (setq alist | |
| 650 (cons (cons (match-string 1 sname) chset) alist)))))) | |
| 651 alist))) | |
| 652 | |
| 653 ;;;###autoload | |
| 654 (defun codepage-setup (codepage) | |
| 24033 | 655 "Create a coding system cpCODEPAGE to support the IBM codepage CODEPAGE. |
| 23915 | 656 |
| 657 These coding systems are meant for encoding and decoding 8-bit non-ASCII | |
| 658 characters used by the IBM codepages, typically in conjunction with files | |
| 24033 | 659 read/written by MS-DOS software, or for display on the MS-DOS terminal." |
| 23915 | 660 (interactive |
| 661 (let ((completion-ignore-case t) | |
| 662 (candidates (cp-supported-codepages))) | |
| 663 (list (completing-read "Setup DOS Codepage: (default 437) " candidates | |
| 664 nil t nil nil "437")))) | |
|
43956
858065a2176d
(codepage-setup): Don't define a codepage if it is already defined.
Eli Zaretskii <eliz@gnu.org>
parents:
41989
diff
changeset
|
665 (let* ((cp (format "cp%s" codepage)) |
|
858065a2176d
(codepage-setup): Don't define a codepage if it is already defined.
Eli Zaretskii <eliz@gnu.org>
parents:
41989
diff
changeset
|
666 (cp-defined (intern-soft cp))) |
|
858065a2176d
(codepage-setup): Don't define a codepage if it is already defined.
Eli Zaretskii <eliz@gnu.org>
parents:
41989
diff
changeset
|
667 (or (and cp-defined ;; avoid defining if already defined |
|
858065a2176d
(codepage-setup): Don't define a codepage if it is already defined.
Eli Zaretskii <eliz@gnu.org>
parents:
41989
diff
changeset
|
668 (coding-system-p cp-defined)) |
|
858065a2176d
(codepage-setup): Don't define a codepage if it is already defined.
Eli Zaretskii <eliz@gnu.org>
parents:
41989
diff
changeset
|
669 (cp-make-coding-systems-for-codepage |
|
858065a2176d
(codepage-setup): Don't define a codepage if it is already defined.
Eli Zaretskii <eliz@gnu.org>
parents:
41989
diff
changeset
|
670 cp (cp-charset-for-codepage cp) (cp-offset-for-codepage cp))))) |
| 23915 | 671 |
|
52435
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
672 ;; Add DOS codepages to `non-iso-charset-alist'. |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
673 (eval-after-load "mule-diag" |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
674 '(let ((tail (cp-supported-codepages)) |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
675 elt) |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
676 (while tail |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
677 (setq elt (car tail) tail (cdr tail)) |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
678 ;; Now ELT is (CODEPAGE . CHARSET), where CODEPAGE is a string |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
679 ;; (e.g. "850"), and CHARSET is the charset that characters in CODEPAGE |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
680 ;; are mapped to. |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
681 (unless (assq (intern (concat "cp" (car elt))) non-iso-charset-alist) |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
682 (setq non-iso-charset-alist |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
683 (cons (list (intern (concat "cp" (car elt))) |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
684 (list 'ascii (cdr elt)) |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
685 `(lambda (code) |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
686 (decode-codepage-char ,(string-to-int (car elt)) |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
687 code)) |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
688 (list (list 0 255))) |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
689 non-iso-charset-alist)))))) |
|
528d8a1b09d5
("mule-diag"): Add eval-after-load
Dave Love <fx@gnu.org>
parents:
52401
diff
changeset
|
690 |
| 23915 | 691 (provide 'codepage) |
| 692 | |
| 52401 | 693 ;;; arch-tag: 80328de8-b94e-4386-be26-5876105731f0 |
|
38412
253f761ad37b
Some fixes to follow coding conventions in files maintained by FSF.
Pavel Janík <Pavel@Janik.cz>
parents:
36579
diff
changeset
|
694 ;;; codepage.el ends here |
