changeset 89742:a750cf193ec6

Handle UNICODE2.
author Kenichi Handa <handa@m17n.org>
date Sun, 25 Jan 2004 08:12:37 +0000
parents fb91cfc5ed37
children 664a98295b6d
files admin/charsets/mapconv
diffstat 1 files changed, 8 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- a/admin/charsets/mapconv	Sun Jan 25 07:51:12 2004 +0000
+++ b/admin/charsets/mapconv	Sun Jan 25 08:12:37 2004 +0000
@@ -45,6 +45,8 @@
 	SOURCE="http://www.iana.org/assignments/charset-reg/${BASE}";;
     UNICODE)
 	SOURCE="http://www.unicode.org/Public/MAPPINGS/.../${BASE}";;
+    UNICODE2)
+	SOURCE="http://www.unicode.org/Public/MAPPINGS/.../${BASE}";;
     YASUOKA)
 	SOURCE="http://kanji.zinbun.kyoto-u.ac.jp/~yasuoka/.../${BASE}";;
     MICROSOFT)
@@ -107,6 +109,12 @@
     sed -n -e "$2 p" < $1 \
 	| sed -e 's/\([0-9A-F]*\)[^0-9A-F]*\([0-9A-F]*\).*/0x\2 0x\1/' \
 	| sort | ${AWKPROG}
+elif [ "$3" == "UNICODE2" ] ; then
+    # Source format is:
+    #   0xXXXX	0xYYYY	# ...
+    sed -n -e "$2 p" < $1 \
+	| sed -e 's/\([0-9A-Fx]*\)[^0]*\([0-9A-Fx]*\).*/\1 \2/' \
+	| sort | ${AWKPROG}
 elif [ "$3" == "YASUOKA" ] ; then
     # Source format is:
     # YYYY	0-XXXX (XXXX is a Kuten code)