Mercurial > emacs
annotate lisp/language/tibet-util.el @ 89452:6cc7c4aa53cc
(Fset_unibyte_charset): Fix setting up of
unibyte_to_multibyte_table.
(init_charset_once): Likewise.
author | Kenichi Handa <handa@m17n.org> |
---|---|
date | Fri, 30 May 2003 06:03:22 +0000 |
parents | 5b82d8f14d06 |
children | 2f877ed80fa6 |
rev | line source |
---|---|
36685 | 1 ;;; tibet-util.el --- utilities for Tibetan -*- coding: iso-2022-7bit; -*- |
17301 | 2 |
3 ;; Copyright (C) 1995 Electrotechnical Laboratory, JAPAN. | |
18377
8b4a66c66dd6
Change copyright notice.
Richard M. Stallman <rms@gnu.org>
parents:
18309
diff
changeset
|
4 ;; Licensed to the Free Software Foundation. |
17301 | 5 |
6 ;; Keywords: multilingual, Tibetan | |
7 | |
8 ;; This file is part of GNU Emacs. | |
9 | |
10 ;; GNU Emacs is free software; you can redistribute it and/or modify | |
11 ;; it under the terms of the GNU General Public License as published by | |
12 ;; the Free Software Foundation; either version 2, or (at your option) | |
13 ;; any later version. | |
14 | |
15 ;; GNU Emacs is distributed in the hope that it will be useful, | |
16 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of | |
17 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
18 ;; GNU General Public License for more details. | |
19 | |
20 ;; You should have received a copy of the GNU General Public License | |
21 ;; along with GNU Emacs; see the file COPYING. If not, write to the | |
22 ;; Free Software Foundation, Inc., 59 Temple Place - Suite 330, | |
23 ;; Boston, MA 02111-1307, USA. | |
24 | |
25 ;; Author: Toru TOMABECHI, <Toru.Tomabechi@orient.unil.ch> | |
26 | |
27 ;; Created: Feb. 17. 1997 | |
28 | |
38436
b174db545cfd
Some fixes to follow coding conventions.
Pavel Janík <Pavel@Janik.cz>
parents:
36685
diff
changeset
|
29 ;;; History: |
17301 | 30 ;; 1997.03.13 Modification in treatment of text properties; |
31 ;; Support for some special signs and punctuations. | |
26896 | 32 ;; 1999.10.25 Modification for a new composition way by K.Handa. |
17301 | 33 |
38436
b174db545cfd
Some fixes to follow coding conventions.
Pavel Janík <Pavel@Janik.cz>
parents:
36685
diff
changeset
|
34 ;;; Commentary: |
b174db545cfd
Some fixes to follow coding conventions.
Pavel Janík <Pavel@Janik.cz>
parents:
36685
diff
changeset
|
35 |
17301 | 36 ;;; Code: |
37 | |
17993
73869115ae0a
Most of setup-LANGUAGE-environment functions are
Kenichi Handa <handa@m17n.org>
parents:
17776
diff
changeset
|
38 ;;;###autoload |
(defun tibetan-char-p (ch)
  "Return non-nil if character CH belongs to a Tibetan charset.
CH counts as Tibetan when `char-charset' reports either `tibetan' or
`tibetan-1-column' for it.  Otherwise the result is nil."
  (let ((charset (char-charset ch)))
    (memq charset '(tibetan tibetan-1-column))))
43 | |
44 ;;; Functions for Tibetan <-> Tibetan-transcription. | |
17301 | 45 |
46 ;;;###autoload | |
(defun tibetan-tibetan-to-transcription (str)
  "Return the Roman transcription of the Tibetan string STR.
STR is scanned from left to right.  Wherever
`tibetan-precomposition-rule-regexp' matches at the current position,
the whole match is transcribed as one unit by way of
`tibetan-precomposition-rule-alist' and
`tibetan-precomposed-transcription-alist'.  Otherwise one character is
looked up in the consonant, vowel and subjoined transcription alists,
in that order.  A piece that has no transcription contributes nothing
to the result."
  (let ((pos 0)
        (end (length str))
        ;; Transcribed pieces, most recent first.
        (pieces nil)
        piece)
    (while (< pos end)
      (if (eq (string-match tibetan-precomposition-rule-regexp str pos) pos)
          ;; A precomposable sequence starts at POS: transcribe it whole.
          (let ((precomposed
                 (cdr (assoc (match-string 0 str)
                             tibetan-precomposition-rule-alist))))
            (setq pos (match-end 0)
                  piece (car (rassoc precomposed
                                     tibetan-precomposed-transcription-alist))))
        ;; Otherwise transcribe exactly one character.
        (let ((one (substring str pos (1+ pos))))
          (setq pos (1+ pos)
                piece (car (or (rassoc one tibetan-consonant-transcription-alist)
                               (rassoc one tibetan-vowel-transcription-alist)
                               (rassoc one tibetan-subjoined-transcription-alist))))))
      (setq pieces (cons piece pieces)))
    (apply 'concat (nreverse pieces))))
17301 | 73 |
74 ;;;###autoload | |
(defun tibetan-transcription-to-tibetan (str)
  "Convert the Roman transcription STR into a Tibetan character string.
Each match of `tibetan-regexp' in STR is replaced by its Tibetan
equivalent.  The precomposed transcription alist is consulted first,
then the consonant, vowel, modifier and subjoined transcription alists
in that order.  Text between matches is copied unchanged.  Matching is
case-sensitive.  The returned string has no composition information."
  (let ((case-fold-search nil)          ; Case is significant.
        (pos 0)
        ;; Output pieces, most recent first.
        (chunks nil)
        hit roman)
    (while (setq hit (string-match tibetan-regexp str pos))
      ;; Text skipped over before the match is not a transcription;
      ;; keep it verbatim.
      (when (> hit pos)
        (setq chunks (cons (substring str pos hit) chunks)))
      (setq roman (match-string 0 str))
      (setq pos (match-end 0))
      (let* ((precomposed
              (cdr (assoc roman tibetan-precomposed-transcription-alist)))
             (tibetan
              (if precomposed
                  ;; ROMAN names a precomposable Tibetan sequence.
                  (car (rassoc precomposed tibetan-precomposition-rule-alist))
                (cdr (or (assoc roman tibetan-consonant-transcription-alist)
                         (assoc roman tibetan-vowel-transcription-alist)
                         (assoc roman tibetan-modifier-transcription-alist)
                         (assoc roman tibetan-subjoined-transcription-alist))))))
        (setq chunks (cons tibetan chunks))))
    ;; Copy whatever follows the last match.
    (when (< pos (length str))
      (setq chunks (cons (substring str pos) chunks)))
    (apply 'concat (nreverse chunks))))
17301 | 108 |
109 ;;; | |
26896 | 110 ;;; Functions for composing/decomposing Tibetan sequence. |
17301 | 111 ;;; |
112 ;;; A Tibetan syllable is typically structured as follows: | |
113 ;;; | |
114 ;;; [Prefix] C [C+] V [M] [Suffix [Post suffix]] | |
115 ;;; | |
;;; where the C's are all vertically stacked, V appears below or above
;;; the consonant cluster, and M is always put above the C[C+]V combination.
;;; (Sanskrit visarga, though it is a vowel modifier, is considered
;;; to be a punctuation mark.)
120 ;;; | |
29828 | 121 ;;; Here are examples of the words "bsgrubs" and "hfauM" |
17301 | 122 ;;; |
89304
5b82d8f14d06
(tibetan-composition-function): Change
Kenichi Handa <handa@m17n.org>
parents:
42839
diff
changeset
|
123 ;;; $(7"7"G###C"U"7"G(B $(7"H"R"U"_(B |
17301 | 124 ;;; |
125 ;;; M | |
126 ;;; b s b s h | |
29828 | 127 ;;; g fa |
17301 | 128 ;;; r u |
129 ;;; u | |
130 ;;; | |
;;; Consonants `'' ($(7"A(B), `w' ($(7">(B), `y' ($(7"B(B), `r' ($(7"C(B) take special
;;; forms when they are used as subjoined consonants.  Consonant `r'
;;; takes another special form when used as a superjoined consonant, as
;;; in "rka", while it does not change its form when conjoined with
;;; subjoined `'', `w' or `y' as in "rwa", "rya".
136 | |
137 ;; Append a proper composition rule and glyph to COMPONENTS to compose | |
138 ;; CHAR with a composition that has COMPONENTS. | |
17301 | 139 |
(defun tibetan-add-components (components char)
  "Append CHAR, preceded by a composition rule, to the list COMPONENTS.
COMPONENTS is a non-empty list of composition components.  It is
modified destructively: elements are attached after its last cons, and
the last element itself may be replaced by another glyph.

If CHAR is one of the composite vowel signs tested for in the body, it
is replaced by the second element of its entry in
`tibetan-composite-vowel-alist', and a copy of the remaining elements
of that entry is appended after it.

The rule is the cons (tc . bc) when the category set of CHAR contains
?2, and (bc . tc) in the other cases.  For one particular lower vowel
sign no rule is chosen, and then neither a rule nor CHAR is appended."
  (let ((last (last components))
        (stack-upper '(tc . bc))
        (stack-under '(bc . tc))
        rule comp-vowel)
    ;; Special treatment for 'a chung.
    ;; If 'a follows a consonant, turn it into the subjoined form.
    ;; * Disabled by Tomabechi 2000/06/09 *
    ;; Because in Unicode, $(7"A(B may follow directly a consonant without
    ;; any intervening vowel, as in $(7"9"""Q"A!;(B=$(7"9(B $(7""(B $(7"A(B not $(7"9(B $(7""(B $(7"Q(B $(7"A(B
    ;;(if (and (= char ?$(7"A(B)
    ;; (aref (char-category-set (car last)) ?0))
    ;; (setq char ?$(7"R(B)) ;; modified for new font by Tomabechi 1999/12/10

    ;; Composite vowel signs are decomposed before being added
    ;; Added by Tomabechi 2000/06/08
    (if (memq char '(?$(7"T(B ?$(7"V(B ?$(7"W(B ?$(7"X(B ?$(7"Y(B ?$(7"Z(B ?$(7"b(B))
        ;; COMP-VOWEL must be computed from the original CHAR, so it is
        ;; assigned before CHAR is replaced in the same `setq'.
        (setq comp-vowel
              (copy-sequence
               (cddr (assoc (char-to-string char)
                            tibetan-composite-vowel-alist)))
              char
              (cadr (assoc (char-to-string char)
                           tibetan-composite-vowel-alist))))
    (cond
     ;; Compose upper vowel sign vertically over.
     ((aref (char-category-set char) ?2)
      (setq rule stack-upper))

     ;; Compose lower vowel sign vertically under.
     ((aref (char-category-set char) ?3)
      (if (eq char ?$(7"Q(B) ;; `$(7"Q(B' should not be visible when composed.
          (setq rule nil)
        (setq rule stack-under)))
     ;; Transform ra-mgo (superscribed r) if followed by a subjoined
     ;; consonant other than w, ', y, r.
     ((and (= (car last) ?$(7"C(B)
           (not (memq char '(?$(7#>(B ?$(7"R(B ?$(7#B(B ?$(7#C(B))))
      (setcar last ?$(7!"(B) ;; modified for newfont by Tomabechi 1999/12/10
      (setq rule stack-under))
     ;; Transform initial base consonant if followed by a subjoined
     ;; consonant but 'a.
     (t
      (let ((laststr (char-to-string (car last))))
        (if (and (/= char ?$(7"R(B) ;; modified for new font by Tomabechi
                 (string-match "[$(7"!(B-$(7"="?"@"D(B-$(7"J"K(B]" laststr))
            (setcar last (string-to-char
                          (cdr (assoc (char-to-string (car last))
                                      tibetan-base-to-subjoined-alist)))))
        (setq rule stack-under))))

    ;; Attach the rule and CHAR after the last component, unless the
    ;; rule was deliberately left nil above.
    (if rule
        (setcdr last (list rule char)))
    ;; Added by Tomabechi 2000/06/08
    (if comp-vowel
        (nconc last comp-vowel))))
17301 | 197 |
198 ;;;###autoload | |
(defun tibetan-compose-string (str)
  "Compose the Tibetan sequences found in STR and return STR.
Each match of `tibetan-composable-pattern' in STR is turned into one
composition.  The component list starts with the precomposed character
when `tibetan-precomposition-rule-regexp' matches at the start of the
sequence, and with the first character of the sequence otherwise.  The
remaining characters are added one by one with
`tibetan-add-components'."
  (let ((pos 0))
    ;; `$(7"A(B' is included in the pattern for subjoined consonants
    ;; because we treat it specially in tibetan-add-components.
    ;; (This feature is removed by Tomabechi 2000/06/08)
    (while (setq pos (string-match tibetan-composable-pattern str pos))
      (let* ((start pos)
             (limit (match-end 0))
             (parts
              (if (eq (string-match tibetan-precomposition-rule-regexp str pos)
                      pos)
                  ;; The sequence begins with a precomposable cluster:
                  ;; start from its precomposed character and skip it.
                  (prog1
                      (list (string-to-char
                             (cdr (assoc (match-string 0 str)
                                         tibetan-precomposition-rule-alist))))
                    (setq pos (match-end 0)))
                ;; Otherwise start from the first character as is.
                (prog1 (list (aref str pos))
                  (setq pos (1+ pos))))))
        (while (< pos limit)
          (tibetan-add-components parts (aref str pos))
          (setq pos (1+ pos)))
        (compose-string str start limit parts))))
  str)
17301 | 223 |
19553
e63ba5228950
(tibetan-composition): Add autoload cookies.
Kenichi Handa <handa@m17n.org>
parents:
19366
diff
changeset
|
224 ;;;###autoload |
(defun tibetan-compose-region (beg end)
  "Compose Tibetan text in the region between BEG and END.
Each match of `tibetan-composable-pattern' in the region is turned into
one composition.  The component list starts with the precomposed
character when `tibetan-precomposition-rule-regexp' matches at the
start of the sequence, and with the first character of the sequence
otherwise.  The remaining characters are added one by one with
`tibetan-add-components'.  Point and the current restriction are
preserved.  The return value is nil."
  (interactive "r")
  (save-excursion
    (save-restriction
      (narrow-to-region beg end)
      (goto-char (point-min))
      ;; `$(7"A(B' is included in the pattern for subjoined consonants
      ;; because we treat it specially in tibetan-add-components.
      ;; (This feature is removed by Tomabechi 2000/06/08)
      (while (re-search-forward tibetan-composable-pattern nil t)
        (let ((from (match-beginning 0))
              (to (match-end 0))
              components)
          ;; Go back to the start of the sequence and walk through it.
          (goto-char from)
          (if (looking-at tibetan-precomposition-rule-regexp)
              (progn
                (setq components
                      (list (string-to-char
                             (cdr
                              (assoc (match-string 0)
                                     tibetan-precomposition-rule-alist)))))
                (goto-char (match-end 0)))
            (setq components (list (char-after from)))
            (forward-char 1))
          (while (< (point) to)
            (tibetan-add-components components (following-char))
            (forward-char 1))
          (compose-region from to components))))))
17301 | 255 |
29363
1ebd8db9c3dc
(tibetan-add-components): Fixes for new
Kenichi Handa <handa@m17n.org>
parents:
28906
diff
changeset
|
(defvar tibetan-decompose-precomposition-alist
  (mapcar (lambda (rule)
            (cons (string-to-char (cdr rule)) (car rule)))
          tibetan-precomposition-rule-alist)
  "Alist derived from `tibetan-precomposition-rule-alist' for decomposition.
Each element has the form (CHAR . KEY), where KEY is the car of an
element of `tibetan-precomposition-rule-alist' and CHAR is the first
character of that element's cdr.")
1ebd8db9c3dc
(tibetan-add-components): Fixes for new
Kenichi Handa <handa@m17n.org>
parents:
28906
diff
changeset
|
259 |
17301 | 260 ;;;###autoload |
29363
1ebd8db9c3dc
(tibetan-add-components): Fixes for new
Kenichi Handa <handa@m17n.org>
parents:
28906
diff
changeset
|
(defun tibetan-decompose-region (from to)
  "Decompose Tibetan text in the region between FROM and TO.
Unlike `decompose-region', this also replaces every character that has
an entry in `tibetan-decompose-precomposition-alist' by the string
recorded for it there, so that precomposed Tibetan characters become
normal Tibetan character sequences."
  (interactive "r")
  (save-restriction
    (narrow-to-region from to)
    (decompose-region from to)
    (goto-char from)
    ;; Walk to the end of the narrowed region one character at a time.
    (while (< (point) (point-max))
      (let ((entry (assq (following-char)
                         tibetan-decompose-precomposition-alist)))
        (cond
         (entry
          ;; Inserting leaves point after the replacement text, so it
          ;; is not examined again.
          (delete-char 1)
          (insert (cdr entry)))
         (t
          (forward-char 1)))))))
1ebd8db9c3dc
(tibetan-add-components): Fixes for new
Kenichi Handa <handa@m17n.org>
parents:
28906
diff
changeset
|
278 |
1ebd8db9c3dc
(tibetan-add-components): Fixes for new
Kenichi Handa <handa@m17n.org>
parents:
28906
diff
changeset
|
279 |
26896 | 280 ;;;###autoload |
29363
1ebd8db9c3dc
(tibetan-add-components): Fixes for new
Kenichi Handa <handa@m17n.org>
parents:
28906
diff
changeset
|
(defun tibetan-decompose-string (str)
  "Return a decomposed copy of the Tibetan string STR.
Unlike `decompose-string', this replaces every character that has an
entry in `tibetan-decompose-precomposition-alist' by the string
recorded for it there, so that precomposed Tibetan characters become
normal Tibetan character sequences.  All other characters are copied
unchanged.  STR itself is not modified."
  ;; Build the result in one pass instead of re-concatenating the
  ;; accumulated string once per character.
  (mapconcat (lambda (char)
               (let ((slot (assq char tibetan-decompose-precomposition-alist)))
                 (if slot
                     (cdr slot)
                   (char-to-string char))))
             str
             ""))
26896 | 295 |
296 ;;;###autoload | |
89304
5b82d8f14d06
(tibetan-composition-function): Change
Kenichi Handa <handa@m17n.org>
parents:
42839
diff
changeset
|
(defun tibetan-composition-function (pos &optional string)
  "Compose the Tibetan sequence that starts one character before POS.
If STRING is non-nil, do nothing and return nil; composing within a
string is not yet implemented.  Otherwise, if the position before POS
is not before `point-min' and `tibetan-composable-pattern' matches
there, compose the matched text with `tibetan-compose-region' and
return the position where the match ends.  Return nil in all other
cases.  Point is preserved."
  (let ((start (1- pos)))
    (cond
     ;; Not yet implemented.
     (string nil)
     ((< start (point-min)) nil)
     (t
      (save-excursion
        (goto-char start)
        (and (looking-at tibetan-composable-pattern)
             ;; Record the end of the match before composing.
             (let ((limit (match-end 0)))
               (tibetan-compose-region start limit)
               limit)))))))
17301 | 308 |
309 ;;; | |
310 ;;; This variable is used to avoid repeated decomposition. | |
311 ;;; | |
;; Default value of the flag: text is not decomposed.
(set-default 'tibetan-decomposed nil)
313 | |
314 ;;;###autoload | |
(defun tibetan-decompose-buffer ()
  "Decompose the Tibetan characters in the buffer into their components.
The work is done by `tibetan-decompose-region' on the accessible
portion of the buffer.  Nothing is done when the buffer-local flag
`tibetan-decomposed' is already non-nil; otherwise the flag is set to t
afterwards."
  (interactive)
  (make-local-variable 'tibetan-decomposed)
  ;; The flag avoids decomposing the same buffer twice.
  (unless tibetan-decomposed
    (tibetan-decompose-region (point-min) (point-max))
    (setq tibetan-decomposed t)))
323 | |
324 ;;;###autoload | |
(defun tibetan-compose-buffer ()
  "Compose the Tibetan character components in the buffer.
The work is done by `tibetan-compose-region' on the accessible portion
of the buffer.  Afterwards the buffer-local flag `tibetan-decomposed'
is reset to nil."
  (interactive)
  (make-local-variable 'tibetan-decomposed)
  (let ((start (point-min))
        (end (point-max)))
    (tibetan-compose-region start end))
  (setq tibetan-decomposed nil))
332 | |
333 ;;;###autoload | |
(defun tibetan-post-read-conversion (len)
  "Compose the Tibetan text in the LEN characters that follow point.
The buffer's modified flag is restored after composing, and the
buffer-local flag `tibetan-decomposed' is set to nil.  Point and the
current restriction are preserved.  The return value is the length of
the processed text after composition."
  (save-excursion
    (save-restriction
      (let ((was-modified (buffer-modified-p))
            (start (point)))
        (narrow-to-region start (+ start len))
        (tibetan-compose-region (point-min) (point-max))
        ;; Composing must not mark the buffer as modified.
        (set-buffer-modified-p was-modified)
        (set (make-local-variable 'tibetan-decomposed) nil)
        (- (point-max) (point-min))))))
17301 | 344 |
345 | |
346 ;;;###autoload | |
(defun tibetan-pre-write-conversion (from to)
  "Put a decomposed copy of the text to be written into a new buffer.
If FROM is a string, that string is the text; otherwise the text is the
part of the current buffer between FROM and TO.  The text is inserted
into a newly generated buffer, which is left as the current buffer.
Unless `tibetan-decomposed' was non-nil in the original buffer, the
copy is decomposed with `tibetan-decompose-region'.  The return value
is always nil."
  ;; Save the flag before switching buffers; it is read again after
  ;; the new buffer has become current.
  (setq tibetan-decomposed-temp tibetan-decomposed)
  (let ((source-buffer (current-buffer))
        (work-buffer (generate-new-buffer " *temp*")))
    (set-buffer work-buffer)
    (cond
     ((stringp from)
      (insert from))
     (t
      (insert-buffer-substring source-buffer from to)))
    (or tibetan-decomposed-temp
        (tibetan-decompose-region (point-min) (point-max)))
    ;; Should return nil as annotations.
    nil))
17301 | 358 |
18309
bd8b521f5218
Provide XXX-util instead of
Kenichi Handa <handa@m17n.org>
parents:
17993
diff
changeset
|
359 (provide 'tibet-util) |
17301 | 360 |
38436
b174db545cfd
Some fixes to follow coding conventions.
Pavel Janík <Pavel@Janik.cz>
parents:
36685
diff
changeset
|
361 ;;; tibet-util.el ends here |