annotate lisp/language/tv-util.el @ 90938:ab2b53b01252

New file.
author Kenichi Handa <handa@m17n.org>
date Sat, 16 Jun 2007 01:57:15 +0000
parents
children bba587c2b334
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
90938
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
1 ;;; tv-util.el --- support for Tai Viet -*- coding: utf-8 -*-
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
2
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
3 ;; Copyright (C) 2007
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
4 ;; National Institute of Advanced Industrial Science and Technology (AIST)
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
5 ;; Registration Number H13PRO009
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
6
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
7 ;; Keywords: multilingual, Tai Viet, i18n
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
8
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
9 ;; This file is part of GNU Emacs.
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
10
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
11 ;; GNU Emacs is free software; you can redistribute it and/or modify
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
12 ;; it under the terms of the GNU General Public License as published by
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
13 ;; the Free Software Foundation; either version 2, or (at your option)
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
14 ;; any later version.
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
15
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
16 ;; GNU Emacs is distributed in the hope that it will be useful,
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
17 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
18 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
19 ;; GNU General Public License for more details.
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
20
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
21 ;; You should have received a copy of the GNU General Public License
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
22 ;; along with GNU Emacs; see the file COPYING. If not, write to the
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
23 ;; Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
24 ;; Boston, MA 02110-1301, USA.
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
25
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
26 ;;; Code:
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
27
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
(defconst tai-viet-re
  ;; A plain literal: the original wrapped this in an argument-less
  ;; `format' call, which did nothing useful.
  "[\xaa80-\xaac2\xaadb-\xaadf]+"
  "Regexp matching a sequence of one or more Tai Viet characters.
The character class covers the code point ranges #xAA80..#xAAC2 and
#xAADB..#xAADF.")
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
31
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
(defconst tai-viet-glyph-info
  (let ((glyph-table (make-char-table nil)))
    ;; Start by tagging every Tai Viet character with plain `t'.
    (dolist (range '((#xaa80 . #xaac2) (#xaadb . #xaadf)))
      (set-char-table-range glyph-table range t))
    ;; Then replace the tag of each special character with the symbol
    ;; naming its category.
    (dolist (entry '((right-overhang . "ꪊꪋꪌꪍꪏꪓꪖꪜꪞꪡꪤꪨ")
                     (left-overhang . "ꫂ")
                     (combining-vowel . "ꪴꪰꪲꪳꪷꪸꪾ")
                     (combining-tone . "꪿꫁")))
      (dolist (special-char (append (cdr entry) nil))
        (aset glyph-table special-char (car entry))))
    glyph-table)
  "Char-table of information about glyph type of Tai Viet characters.
The value for a Tai Viet character is one of the symbols
`right-overhang', `left-overhang', `combining-vowel' or
`combining-tone', or t when the character is in none of those
categories.  The value for any other character is nil.")
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
49
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
(defun tai-viet-compose-string (from to string)
  "Compose Tai Viet characters in STRING between indices FROM and TO.
The character at FROM is always examined.  Scanning then continues
while the index is below TO and the character at that index has a
non-nil entry in `tai-viet-glyph-info'.
Return the index just after the last character scanned."
  (let* ((ch (aref string from))
         (info (aref tai-viet-glyph-info ch))
         (prev-info info)
         next next-info)
    ;; NOTE(review): `tai-viet-glyph-info' as defined in this file never
    ;; yields `non-spacing' (it uses `combining-vowel' and
    ;; `combining-tone'), so the two `non-spacing' branches below look
    ;; unreachable -- confirm which category names are intended.
    (if (eq info 'non-spacing)
        (compose-string string from (1+ from) (string ch ?\t)))
    (setq from (1+ from))
    ;; Look the next character up in the glyph table instead of calling
    ;; a separate predicate: the table is non-nil exactly for Tai Viet
    ;; characters.  NEXT/NEXT-INFO are only copied into CH/INFO once the
    ;; character is accepted, so CH and INFO always describe the same
    ;; (last scanned) character after the loop.
    (while (and (< from to)
                (setq next (aref string from)
                      next-info (aref tai-viet-glyph-info next)))
      (setq ch next
            info next-info)
      (if (and (eq info 'non-spacing)
               (eq prev-info 'non-spacing))
          ;; STRING must be the first argument of `compose-string'.
          (compose-string string from (1+ from) (string ?\t ch)))
      (setq from (1+ from)
            prev-info info))
    ;; Pad a final right-overhang character with a trailing TAB.
    (if (eq info 'right-overhang)
        (compose-string string (1- from) from (string ch ?\t)))
    from))
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
68
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
(defun tai-viet-compose-region (from to)
  "Compose Tai Viet characters in the region between FROM and TO.
Any existing composition in the region is removed first.  The text is
then scanned left to right using `tai-viet-glyph-info':
- a combining vowel or tone that is not attached to a preceding base
  is composed with a leading TAB so it is displayed as a spacing glyph;
- a base character is composed with a directly following combining
  character and, after that, an optional tone mark;
- TAB padding is added before a left-overhang base that does not
  follow another Tai Viet character, and after a right-overhang
  cluster that ends the region.
Return the buffer position where scanning stopped."
  (decompose-region from to)
  (let ((normal-rule '(Br . Bl))
        (tone-rule '(tr . bl))
        (prev-viet nil)
        ch info pos components overhang)
    (while (< from to)
      ;; CH and INFO act as a one-character lookahead cache: when CH is
      ;; non-nil it already describes the character at FROM.
      (or ch
          (setq ch (char-after from)
                info (aref tai-viet-glyph-info ch)))
      (setq from (1+ from))
      (cond
       ((not info)
        ;; Not a Tai Viet character.
        (setq prev-viet nil
              ch nil))
       ((memq info '(combining-vowel combining-tone))
        ;; Display this as a spacing glyph.
        (compose-region (1- from) from (string ?\t ch))
        (setq prev-viet t
              ch nil))
       (t
        ;; A base character; remember where the cluster starts.
        (setq pos (1- from)
              components ch
              overhang (cond ((eq info 'right-overhang)
                              'right-overhang)
                             ((and (not prev-viet)
                                   (eq info 'left-overhang))
                              'left-overhang))
              prev-viet t
              ch nil)
        (if (and (< from to)
                 (setq ch (char-after from)
                       info (aref tai-viet-glyph-info ch))
                 (memq info '(combining-vowel combining-tone)))
            (progn
              ;; Attach the combining character to the base.
              (setq components (list components normal-rule ch)
                    from (1+ from)
                    ch nil)
              (when (and (< from to)
                         (setq ch (char-after from)
                               info (aref tai-viet-glyph-info ch))
                         (eq info 'combining-tone))
                (setq components (nconc components
                                        (list tone-rule ch))
                      from (1+ from)
                      ;; The tone mark has been consumed, so drop it
                      ;; from the lookahead cache.  Otherwise the next
                      ;; iteration would treat the character at FROM
                      ;; as this tone mark.
                      ch nil))
              (cond ((eq overhang 'left-overhang)
                     (setq components
                           (cons ?\t (cons normal-rule components))))
                    ((and (eq overhang 'right-overhang)
                          (>= from to))
                     (setq components
                           (nconc components
                                  (list normal-rule ?\t)))))
              (compose-region pos from components))
          ;; A lone base character: only overhang padding may apply.
          ;; Any lookahead character stays cached in CH for the next
          ;; iteration.
          (cond ((eq overhang 'left-overhang)
                 (compose-region pos from (string ?\t components)))
                ((and (eq overhang 'right-overhang)
                      (>= from to))
                 (compose-region pos from
                                 (string components ?\t))))))))
    from))
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
129
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
130
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
131 ;;;###autoload
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
(defun tai-viet-composition-function (pos &optional string)
  "Compose the run of Tai Viet characters starting at POS.
If STRING is non-nil, POS is an index into STRING and the run is
handled by `tai-viet-compose-string'.  Otherwise POS is a buffer
position; point is moved there and the run is handled by
`tai-viet-compose-region'.
Return the value of the composing function, or POS plus one when no
Tai Viet character starts at POS."
  (if string
      ;; `string-match' searches forward from POS, so require the match
      ;; to begin exactly at POS, as `looking-at' does for buffers.
      (if (eq (string-match tai-viet-re string pos) pos)
          (tai-viet-compose-string pos (match-end 0) string)
        (1+ pos))
    (goto-char pos)
    (if (looking-at tai-viet-re)
        (tai-viet-compose-region pos (match-end 0))
      (1+ pos))))
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
143
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
144 ;;
ab2b53b01252 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
145 (provide 'tai-viet-util)