Mercurial > emacs
changeset 89750:d6d9f1efd684
New file.
author | Kenichi Handa <handa@m17n.org> |
---|---|
date | Tue, 27 Jan 2004 01:59:12 +0000 |
parents | f30ee7fd9c53 |
children | a6bed93396e8 |
files | admin/charsets/cp51932.awk admin/charsets/eucjp-ms.awk |
diffstat | 2 files changed, 140 insertions(+), 0 deletions(-) [+] |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/admin/charsets/cp51932.awk Tue Jan 27 01:59:12 2004 +0000 @@ -0,0 +1,57 @@ +# cp51932.awk -- Generate a translation table for CP51932. +# Copyright (C) 2004 +# National Institute of Advanced Industrial Science and Technology (AIST) +# Registration Number H13PRO009 +# +# This file is part of GNU Emacs. +# +# GNU Emacs is free software; you can redistribute it and/or modify +# it under the terms of the GNU General Public License as published by +# the Free Software Foundation; either version 2, or (at your option) +# any later version. +# +# GNU Emacs is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. +# +# You should have received a copy of the GNU General Public License +# along with GNU Emacs; see the file COPYING. If not, write to the +# Free Software Foundation, Inc., 59 Temple Place - Suite 330, +# Boston, MA 02111-1307, USA. + +# Comment: + +# Genereate a translation table for CP51932 (EUC-JP of MicroSoft Version). +# It maps invalid JISX0208 code points used by CP51932 to Unicode. +# 4th field of the input has these meanings: +# 0: JISX0208 characters. +# 1: NEC special characters. +# 2: IBM extension characters. +# 3: NEC selection of IBM extension characters. +# Among them, 1 and 3 are the target characters. 2 should have +# already been mapped to 1 or 3. + +BEGIN { + print ";;; cp51932.el -- translation table for CP51932. -*- no-byte-compile: t -*-"; + print ";;; Automatically genrated from CP932-2BYTE.map"; + print "(let ((map"; + printf " '(;JISEXT<->UNICODE"; +} + +/# [13]/ { + printf "\n (#x%s . #x%s)", $5 ,substr($2, 3, 4); +} + +END { + print ")))"; + print " (mapc #'(lambda (x)"; + print " (setcar x (decode-char 'japanese-jisx0208 (car x))))"; + print " map)"; + print " (define-translation-table 'cp51932-decode map)"; + print " (mapc #'(lambda (x)"; + print " (let ((tmp (car x)))"; + print " (setcar x (cdr x)) (setcdr x tmp)))"; + print " map)"; + print " (define-translation-table 'cp51932-encode map))"; +}
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/admin/charsets/eucjp-ms.awk Tue Jan 27 01:59:12 2004 +0000 @@ -0,0 +1,83 @@ +# eucjp-ms.awk -- Generate a translation table for eucJP-ms. +# Copyright (C) 2004 +# National Institute of Advanced Industrial Science and Technology (AIST) +# Registration Number H13PRO009 +# +# This file is part of GNU Emacs. +# +# GNU Emacs is free software; you can redistribute it and/or modify +# it under the terms of the GNU General Public License as published by +# the Free Software Foundation; either version 2, or (at your option) +# any later version. +# +# GNU Emacs is distributed in the hope that it will be useful, +# but WITHOUT ANY WARRANTY; without even the implied warranty of +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the +# GNU General Public License for more details. +# +# You should have received a copy of the GNU General Public License +# along with GNU Emacs; see the file COPYING. If not, write to the +# Free Software Foundation, Inc., 59 Temple Place - Suite 330, +# Boston, MA 02111-1307, USA. + +# Comment: + +# eucJP-ms is one of eucJP-open encoding defined at this page: +# http://www.opengroup.or.jp/jvc/cde/appendix.html + +BEGIN { + print ";;; eucjp-ms.el -- translation table for eucJP-ms. -*- no-byte-compile: t -*-"; + print ";;; Automatically genrated from eucJP-13th.txt, eucJP-udc.txt, eucJP-ibmext.txt"; + print "(let ((map"; + printf " '(;JISEXT<->UNICODE"; + + tohex["A"] = 10; + tohex["B"] = 11; + tohex["C"] = 12; + tohex["D"] = 13; + tohex["E"] = 14; + tohex["F"] = 15; +} + +function decode_hex(str) { + n = 0; + len = length(str); + for (i = 1; i <= len; i++) + { + c = substr(str, i, 1); + if (c >= "0" && c <= "9") + n = n * 16 + (c - "0"); + else + n = n * 16 + tohex[c]; + } + return n; +} + +/0x8F/ { + code = decode_hex(substr($1, 5, 4)); + code -= 32896; # code -= 0x8080 + printf "\n (#x%04x #x%s)", code, substr($2, 3, 4); + next; +} + +/0x[A-F]/ { + code = decode_hex(substr($1, 3, 4)); + code -= 32896; # code -= 0x8080 + printf "\n (#x%04x . #x%s)", code, substr($2, 3, 4); +} + +END { + print ")))"; + print " (mapc #'(lambda (x)"; + print " (if (integerp (cdr x))"; + print " (setcar x (decode-char 'japanese-jisx0208 (car x)))"; + print " (setcar x (decode-char 'japanese-jisx0212 (car x)))"; + print " (setcdr x (cadr x))))"; + print " map)"; + print " (define-translation-table 'eucjp-ms-decode map)"; + print " (mapc #'(lambda (x)"; + print " (let ((tmp (car x)))"; + print " (setcar x (cdr x)) (setcdr x tmp)))"; + print " map)"; + print " (define-translation-table 'eucjp-ms-encode map))"; +}