comparison admin/charsets/mapconv @ 89742:a750cf193ec6

Handle UNICODE2.
author Kenichi Handa <handa@m17n.org>
date Sun, 25 Jan 2004 08:12:37 +0000
parents 375f2633d815
children b7afe7c870d3
comparison
equal deleted inserted replaced
89741:fb91cfc5ed37 89742:a750cf193ec6
42 CZYBORRA) 42 CZYBORRA)
43 SOURCE="http://czyborra.com/charsets/${BASE}";; 43 SOURCE="http://czyborra.com/charsets/${BASE}";;
44 IANA) 44 IANA)
45 SOURCE="http://www.iana.org/assignments/charset-reg/${BASE}";; 45 SOURCE="http://www.iana.org/assignments/charset-reg/${BASE}";;
46 UNICODE) 46 UNICODE)
47 SOURCE="http://www.unicode.org/Public/MAPPINGS/.../${BASE}";;
48 UNICODE2)
47 SOURCE="http://www.unicode.org/Public/MAPPINGS/.../${BASE}";; 49 SOURCE="http://www.unicode.org/Public/MAPPINGS/.../${BASE}";;
48 YASUOKA) 50 YASUOKA)
49 SOURCE="http://kanji.zinbun.kyoto-u.ac.jp/~yasuoka/.../${BASE}";; 51 SOURCE="http://kanji.zinbun.kyoto-u.ac.jp/~yasuoka/.../${BASE}";;
50 MICROSOFT) 52 MICROSOFT)
51 SOURCE="http://www.microsoft.com/globaldev/reference/oem/${BASE}";; 53 SOURCE="http://www.microsoft.com/globaldev/reference/oem/${BASE}";;
105 # Source format is: 107 # Source format is:
106 # YYYY XX 108 # YYYY XX
107 sed -n -e "$2 p" < $1 \ 109 sed -n -e "$2 p" < $1 \
108 | sed -e 's/\([0-9A-F]*\)[^0-9A-F]*\([0-9A-F]*\).*/0x\2 0x\1/' \ 110 | sed -e 's/\([0-9A-F]*\)[^0-9A-F]*\([0-9A-F]*\).*/0x\2 0x\1/' \
109 | sort | ${AWKPROG} 111 | sort | ${AWKPROG}
112 elif [ "$3" == "UNICODE2" ] ; then
113 # Source format is:
114 # 0xXXXX 0xYYYY # ...
115 sed -n -e "$2 p" < $1 \
116 | sed -e 's/\([0-9A-Fx]*\)[^0]*\([0-9A-Fx]*\).*/\1 \2/' \
117 | sort | ${AWKPROG}
110 elif [ "$3" == "YASUOKA" ] ; then 118 elif [ "$3" == "YASUOKA" ] ; then
111 # Source format is: 119 # Source format is:
112 # YYYY 0-XXXX (XXXX is a Kuten code) 120 # YYYY 0-XXXX (XXXX is a Kuten code)
113 sed -n -e "$2 p" < $1 \ 121 sed -n -e "$2 p" < $1 \
114 | sed -e 's/\([0-9A-F]*\)[^0]*0-\([0-9]*\).*/0x\2 0x\1/' \ 122 | sed -e 's/\([0-9A-F]*\)[^0]*0-\([0-9]*\).*/0x\2 0x\1/' \