Mercurial > emacs
annotate lisp/language/devan-util.el @ 37068:ac894ffb7b16
*** empty log message ***
author | Eli Zaretskii <eliz@gnu.org> |
---|---|
date | Thu, 29 Mar 2001 15:38:09 +0000 |
parents | 0c75fe9804e2 |
children | b174db545cfd |
rev | line source |
---|---|
17052 | 1 ;;; devan-util.el --- Support for Devanagari Script Composition |
2 | |
36680
0c75fe9804e2
Add coding: tag in Local Variables: section.
Kenichi Handa <handa@m17n.org>
parents:
31446
diff
changeset
|
3 ;; Copyright (C) 1996, 2001 Free Software Foundation, Inc. |
17052 | 4 |
5 ;; Author: KAWABATA, Taichi <kawabata@is.s.u-tokyo.ac.jp> | |
6 | |
7 ;; Keywords: multilingual, Indian, Devanagari | |
8 | |
9 ;; This file is part of GNU Emacs. | |
10 | |
11 ;; GNU Emacs is free software; you can redistribute it and/or modify | |
12 ;; it under the terms of the GNU General Public License as published by | |
13 ;; the Free Software Foundation; either version 2, or (at your option) | |
14 ;; any later version. | |
15 | |
16 ;; GNU Emacs is distributed in the hope that it will be useful, | |
17 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of | |
18 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
19 ;; GNU General Public License for more details. | |
20 | |
21 ;; You should have received a copy of the GNU General Public License | |
17314
f438ebf1c679
Fix FSF address in comment.
Kenichi Handa <handa@m17n.org>
parents:
17300
diff
changeset
|
22 ;; along with GNU Emacs; see the file COPYING. If not, write to the |
f438ebf1c679
Fix FSF address in comment.
Kenichi Handa <handa@m17n.org>
parents:
17300
diff
changeset
|
23 ;; Free Software Foundation, Inc., 59 Temple Place - Suite 330, |
f438ebf1c679
Fix FSF address in comment.
Kenichi Handa <handa@m17n.org>
parents:
17300
diff
changeset
|
24 ;; Boston, MA 02111-1307, USA. |
17052 | 25 |
26 ;;; Commentary: | |
27 | |
28 ;; History: | |
29 ;; 1996.10.18 written by KAWABATA, Taichi <kawabata@is.s.u-tokyo.ac.jp> | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
30 ;; 1997.3.24 fixed some bugs. |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
31 |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
32 ;; Future work :: |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
33 ;; Decompose the input characters and process them on the character basis. |
17052 | 34 |
35 ;; Devanagari script composition rules and related programs. | |
36 | |
37 ;;; Code: | |
38 | |
39 ;;; | |
40 ;;; Steps toward composition of Devanagari Characters. | |
41 ;;; | |
22987
708271862495
(setup-XXX-environment): Just call set-language-environment. If
Kenichi Handa <handa@m17n.org>
parents:
22520
diff
changeset
|
42 |
17052 | 43 ;;; Basic functions. |
44 | |
45 ;;;###autoload | |
26894 | 46 (defun indian-to-devanagari (char) |
47 "Convert IS 13194 character CHAR to Devanagari basic characters. | |
48 If CHAR is not IS 13194, return CHAR as is." | |
49 (let ((charcodes (split-char char))) | |
17052 | 50 (if (eq (car charcodes) 'indian-is13194) |
51 (make-char 'indian-2-column ?\x21 (nth 1 charcodes)) | |
26894 | 52 char))) |
17052 | 53 |
54 ;;;###autoload | |
26894 | 55 (defun devanagari-to-indian (char) |
56 "Convert Devanagari basic character CHAR to IS 13194 characters. | |
57 If CHAR is not Devanagari basic character, return CHAR as is." | |
58 (let ((charcodes (split-char char))) | |
17052 | 59 (if (and (eq (car charcodes) 'indian-2-column) |
60 (= (nth 1 charcodes) ?\x21)) | |
61 (make-char 'indian-is13194 (nth 2 charcodes)) | |
26894 | 62 char))) |
17052 | 63 |
64 ;;;###autoload | |
65 (defun indian-to-devanagari-region (from to) | |
26894 | 66 "Convert IS 13194 characters in region to Devanagari basic characters. |
67 When called from a program, expects two arguments, | |
68 positions (integers or markers) specifying the region." | |
17052 | 69 (interactive "r") |
26894 | 70 (save-excursion |
71 (goto-char from) | |
72 (while (< (point) to) | |
73 (let ((char (following-char))) | |
74 (if (eq (char-charset char) 'indian-is13194) | |
75 (progn | |
76 (delete-char 1) | |
77 (insert (indian-to-devanagari char))) | |
78 (forward-char 1)))))) | |
17052 | 79 |
80 ;;;###autoload | |
81 (defun devanagari-to-indian-region (from to) | |
26894 | 82 "Convert Devanagari basic characters in region to Indian characters. |
83 When called from a program, expects two arguments, | |
84 positions (integers or markers) specifying the region." | |
17052 | 85 (interactive "r") |
26894 | 86 (save-excursion |
87 (goto-char from) | |
88 (while (< (point) to) | |
89 (let ((char (following-char))) | |
90 (if (eq (char-charset char) 'indian-2-column) | |
91 (progn | |
31446
1cc26c3824f9
(devanagari-to-indian-region): In the loop, change the following char,
Kenichi Handa <handa@m17n.org>
parents:
28906
diff
changeset
|
92 (delete-char 1) |
26894 | 93 (insert (devanagari-to-indian char))) |
94 (forward-char 1)))))) | |
17052 | 95 |
96 ;;;###autoload | |
26894 | 97 (defun indian-to-devanagari-string (string) |
98 "Convert Indian characters in STRING to Devanagari Basic characters." | |
99 (let* ((len (length string)) | |
20839 | 100 (i 0) |
101 (vec (make-vector len 0))) | |
102 (while (< i len) | |
26894 | 103 (aset vec i (indian-to-devanagari (aref string i))) |
20839 | 104 (setq i (1+ i))) |
105 (concat vec))) | |
17052 | 106 |
107 ;; Phase 0 - Determine whether the characters can be composed. | |
108 ;; | |
109 ;;; | |
110 ;;; Regular expressions to split characters for composition. | |
111 ;;; | |
112 ;; | |
113 ;; Indian script word contains one or more syllables. | |
114 ;; In BNF, it can be expressed as follows: | |
115 ;; | |
116 ;; Word ::= {Syllable} [Cons-Syllable] | |
117 ;; Syllable ::= Cons-Vowel-Syllable | Vowel-Syllable | |
118 ;; Vowel-Syllable ::= V[D] | |
119 ;; Cons-Vowel-Syllable ::= [Cons-Syllable] Full-Cons [M] [D] | |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
120 ;; Cons-Syllable ::= [Pure-Cons] [Pure-Cons] [Pure-Cons] Pure-Cons |
17052 | 121 ;; Pure-Cons ::= Full-Cons H |
122 ;; Full-Cons ::= C [N] | |
123 ;; | |
124 ;; {} repeat, [] optional | |
125 ;; | |
126 ;; C - Consonant ($(5!3!4!5!6!7!8!9!:!;!<!=!>!?!@!A!B!C!D!E(B | |
127 ;; $(5!F!G!H!I!J!K!L!M!N!O!P!Q!R!S!T!U!V!W!X(B) | |
128 ;; N - Nukta ($(5!i(B) | |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
129 ;; H - Halant($(5!h(B) or Virama |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
130 ;; V - Vowel ($(5!$!%!&!'!(!)!*!+!,!-!.!/!0!1!2#&#'#*(B) |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
131 ;; ("$(5#&#'#*(B" can be obtained by IS13194 vowels with nukta.) |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
132 ;; D - Vowel Modifiers, i.e. Anuswar, Chandrabindu ($(5!!!"(B) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
133 ;; (Visaraga ($(5!#(B) is excluded.) |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
134 ;; M - Matra ($(5!Z![!\!]!^!_!`!a!b!c!d!e!f!g#K#L#M(B) |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
135 ;; ("$(5#K#L#M(B" can be obtained by IS13194 matras with nukta.) |
17052 | 136 ;; |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
137 ;; In Emacs, one syllable of Indian language is considered to be one |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
138 ;; composite glyph. If we expand the above expression for |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
139 ;; cons-vowel-syllable, it would be: |
17052 | 140 ;; |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
141 ;; [[C [N] H] [C [N] H] [C [N] H] C [N] H] C [N] [M] [D] |
17052 | 142 ;; |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
143 ;; Therefore, in worst case, the one syllable may contain |
17052 | 144 ;; following characters. |
145 ;; | |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
146 ;; C N H C N H C N H C N H C N M D |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
147 ;; |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
148 ;; The example is a sanskrit word "kArtsnya", where five consecutive |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
149 ;; consonants appear. |
17052 | 150 ;; |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
151 ;; On the other hand, consonant-syllable, which appears at the end of |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
152 ;; the word, would have the following expression: |
17052 | 153 ;; |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
154 ;; [C [N] H] [C [N] H] [C [N] H] C [N] H |
17052 | 155 ;; |
156 ;; This is acceptable BEFORE proper consonant-syllable is input. The | |
157 ;; string which doesn't match with the above expression is invalid and | |
158 ;; thus must be fixed. | |
159 ;; | |
160 ;; Note: | |
21442 | 161 ;; Third case can be considered, which is an acceptable syllable and can |
17052 | 162 ;; not add any code more. |
163 ;; | |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
164 ;; [[C [N] H] [C [N] H] [C [N] H] C [N] H] C [N] [M] D |
17052 | 165 ;; |
166 ;; However, to make editing possible even in this condition, we will | |
167 ;; not consider about this case. | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
168 ;; |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
169 ;; Note: |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
170 ;; Currently, it seems that the only following consonants would have |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
171 ;; Nukta sign attatched. |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
172 ;; ($(5!3!4!5!:!?!@!I(B) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
173 ;; Therefore, [$(5!3(B-$(5!X(B]$(5!i(B? can be re-written as |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
174 ;; \\([$(5!3!4!5!:!?!@!I(B]$(5!i(B\\)\\|[$(5!3(B-$(5!X(B] |
17052 | 175 |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
176 (defconst devanagari-full-cons |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
177 "\\(\\([$(5!3!4!5!:!?!@!I(B]$(5!i(B\\)\\|[$(5!3(B-$(5!X$.$E"%(B]\\)" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
178 "Devanagari full consonant") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
179 |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
180 (defconst devanagari-pure-cons |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
181 (concat "\\(" devanagari-full-cons "$(5!h(B\\)") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
182 "Devanagari pure consonant") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
183 |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
184 (defconst devanagari-matra |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
185 "\\(\\([$(5!_![!\(B]$(5!i(B\\)\\|[$(5!Z(B-$(5!g#K#L#M(B]\\)" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
186 "Devanagari Matra Signs. '$(5#K#L#M(B' can also be created from the combination |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
187 of '$(5!_![!\(B' and nukta sign.") |
17052 | 188 |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
189 (defconst devanagari-vowel |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
190 "\\(\\([$(5!*!&!'(B]$(5!i(B\\)\\|[$(5!$(B-$(5!2#&#'#*(B]\\)" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
191 "Devanagari Vowels. '$(5#&#'#*(B' can also be created from the combination |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
192 of '$(5!*!&!'(B' and nukta sign.") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
193 |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
194 (defconst devanagari-vowel-syllable |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
195 (concat devanagari-vowel "[$(5!!!"(B]?") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
196 "Devanagari vowel syllable.") |
17052 | 197 |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
198 (defconst devanagari-cons-syllable |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
199 (concat devanagari-pure-cons "?" devanagari-pure-cons "?" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
200 devanagari-pure-cons "?" devanagari-pure-cons "$") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
201 "Devanagari consonant syllable") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
202 |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
203 (defconst devanagari-cons-vowel-syllable |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
204 (concat "\\(" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
205 devanagari-pure-cons "?" devanagari-pure-cons "?" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
206 devanagari-pure-cons "?" devanagari-pure-cons "\\)?" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
207 devanagari-full-cons devanagari-matra "?[$(5!!!"(B]?") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
208 "Devanagari consonant vowel syllable.") |
17052 | 209 |
210 ;; | |
211 ;; Also, digits and virams should be processed other than syllables. | |
212 ;; | |
213 ;; In IS 13194, Avagrah is obtained by Nukta after Viram, and | |
214 ;; OM is obtained by Nukta after Chandrabindu | |
215 ;; | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
216 |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
217 (defconst devanagari-digit-viram-visarga |
22520
901451c61b3f
(devanagari-digit-viram-visarga): Set the
Kenichi Handa <handa@m17n.org>
parents:
21442
diff
changeset
|
218 "[$(5!q(B-$(5!z!j!#(B]") |
901451c61b3f
(devanagari-digit-viram-visarga): Set the
Kenichi Handa <handa@m17n.org>
parents:
21442
diff
changeset
|
219 |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
220 (defconst devanagari-other-sign |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
221 "\\([$(5!!!j(B]$(5!i(B\\)\\|\\([$(5#!#J(B]\\)") |
17052 | 222 |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
223 (defconst devanagari-composite-glyph-unit |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
224 (concat "\\(" devanagari-cons-syllable |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
225 "\\)\\|\\(" devanagari-vowel-syllable |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
226 "\\)\\|\\(" devanagari-cons-vowel-syllable |
22520
901451c61b3f
(devanagari-digit-viram-visarga): Set the
Kenichi Handa <handa@m17n.org>
parents:
21442
diff
changeset
|
227 "\\)\\|\\(" devanagari-other-sign |
901451c61b3f
(devanagari-digit-viram-visarga): Set the
Kenichi Handa <handa@m17n.org>
parents:
21442
diff
changeset
|
228 "\\)\\|\\(" devanagari-digit-viram-visarga "\\)") |
17052 | 229 "Regexp matching to Devanagari string to be composed form one glyph.") |
230 | |
231 ;;(put-charset-property charset-devanagari-1-column | |
232 ;; 'char-to-glyph 'devanagari-compose-string) | |
233 ;;(put-charset-property charset-devanagari-2-column | |
234 ;; 'char-to-glyph 'devanagari-compose-string) | |
235 | |
236 ;; Sample | |
237 ;; | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
238 ;;(string-match devanagari-cons-vowel-syllable-examine "$(5!X![(B") => 0 |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
239 ;;(string-match devanagari-cons-vowel-syllable-examine "$(5!F!h!D!\(B") => 0 |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
240 ;;(string-match devanagari-cons-vowel-syllable-examine "$(5!X![!F!h!D!\(B") => 0 |
17052 | 241 |
242 ;; | |
243 ;; Steps toward the composition | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
244 ;; Converting Character Codes to Composite Glyph. |
17052 | 245 ;; |
246 ;; Example : $(5!X![(B/$(5!F!h!D!\(B | |
247 ;; | |
248 ;; First, convert Characters to appropriate glyphs. | |
249 ;; | |
250 ;; => $(5!X![(B/$(5"F!D!\(B | |
251 ;; | |
252 ;; Then, determine the base glyph, apply-orders and apply-rules. | |
253 ;; | |
254 ;; => $(5!X(B (ml.mr) $(5![(B / $(5!D(B (ml.mr) $(5"F(B (mr ml) $(5!\(B | |
255 ;; | |
256 ;; Finally, convert 2-column glyphs to 1-column glyph | |
257 ;; if such a glyph exist. | |
258 ;; | |
26894 | 259 ;; => $(6!X(B (ml.mr) $(6![(B / $(6!D(B (ml.mr) $(6"F(B (mr ml) $(6!\(B |
17052 | 260 ;; |
261 ;; Compose the glyph. | |
262 ;; | |
26894 | 263 ;; => 4$(6!Xt%![0!X![1(B/4$(6!Dt%"Fv#!\0!D"F!\1(B |
264 ;; => 4$(6!Xt%![0!X![14!Dt%"Fv#!\0!D"F!\1(B | |
17052 | 265 ;; |
266 | |
267 ;; | |
268 ;; Phase 1: Converting Character Code to Glyph Code. | |
269 ;; | |
270 ;; | |
271 ;; IMPORTANT: | |
26894 | 272 ;; There may be many rules that you many want to suppress. |
17052 | 273 ;; In that case, please comment out that rule. |
274 ;; | |
275 ;; RULES WILL BE EVALUATED FROM FIRST TO LAST. | |
276 ;; PUT MORE SPECIFIC RULES FIRST. | |
277 ;; | |
278 ;; TO DO: | |
279 ;; Prepare multiple specific list of rules for each languages | |
26894 | 280 ;; that adopt Devanagari script. |
17052 | 281 ;; |
282 | |
283 (defconst devanagari-char-to-glyph-rules | |
284 '( | |
285 | |
286 ;; `r' at the top of syllable and followed by other consonants. | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
287 ;; ("[^$(5!h(B]\\($(5!O!h(B\\)[$(5!3(B-$(5!X(B]" "$(5"p(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
288 ("^\\($(5!O!h(B\\)[$(5!3(B-$(5!X(B]" "$(5"p(B") |
17052 | 289 |
290 ;; Ligature Rules | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
291 ("\\($(5!3!h!B!h!O!h!M(B\\)" "$(5$!(B" sanskrit) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
292 ("\\($(5!3!h!B!h!T(B\\)" "$(5$"(B" sanskrit) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
293 ("\\($(5!3!h!B!h!M(B\\)" "$(5$#(B" sanskrit) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
294 ("\\($(5!3!h!F!h!M(B\\)" "$(5$$(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
295 ("\\($(5!3!h!O!h!M(B\\)" "$(5$%(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
296 ("\\($(5!3!h!O(B\\)" "$(5"#(B") ; Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
297 ("\\($(5!3!h!T!h!M(B\\)" "$(5$&(B" sanskrit) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
298 ("\\($(5!3!h(B\\)$(5!3!h(B[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"3(B") ; Special Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
299 ("\\($(5!3!h!3(B\\)" "$(5$'(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
300 ("\\($(5!3!h(B\\)$(5!B!h!O(B" "$(5"3(B") ; Special Rules for "k-tr" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
301 ("\\($(5!3!h!B(B\\)" "$(5$((B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
302 ("\\($(5!3!h!F(B\\)" "$(5$)(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
303 ("\\($(5!3!h!L(B\\)" "$(5$*(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
304 ("\\($(5!3!h!M(B\\)" "$(5$+(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
305 ("\\($(5!3!h!Q(B\\)" "$(5$,(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
306 ("\\($(5!3!h!T(B\\)" "$(5$-(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
307 ("\\($(5!3!h!V!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"l(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
308 ("\\($(5$.!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"l(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
309 ("\\($(5!3!h!V(B\\)" "$(5$.(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
310 ("\\($(5!3!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"3(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
311 ("\\($(5!3!i!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"s(B") ; Nukta Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
312 ("\\($(5!3!i(B\\)" "$(5#3(B") ; Nukta |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
313 ("\\($(5!4!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"4(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
314 ("\\($(5!4!i!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"t(B") ; Nukta Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
315 ("\\($(5!4!i(B\\)" "$(5#4(B") ; Nukta |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
316 ("\\($(5!5!h!O!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"`(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
317 ("\\($(5!5!h!O(B\\)" "$(5"$(B") ; Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
318 ("\\($(5!5!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"5(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
319 ("\\($(5!5!i!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"u(B") ; Nukta Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
320 ("\\($(5!5!i(B\\)" "$(5#5(B") ; Nukta |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
321 ("\\($(5!6!h!F!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"a(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
322 ("\\($(5!6!h!F(B\\)" "$(5$/(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
323 ; Slot |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
324 ("\\($(5!6!h!O(B\\)" "$(5!6"q(B") ; Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
325 ("\\($(5!6!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"6(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
326 ("\\($(5!7!h!3!h!B!h!M(B\\)" "$(5$0(B" sanskrit) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
327 ("\\($(5!7!h!3!h!V!h!T(B\\)" "$(5$1(B" sanskrit) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
328 ("\\($(5!7!h!3!h!B(B\\)" "$(5$2(B" sanskrit) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
329 ("\\($(5!7!h!3!h!V(B\\)" "$(5$3(B" sanskrit) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
330 ("\\($(5!7!h!3!h!O(B\\)" "$(5$9"q(B") ; Special Rule. May be precomposed font needed. |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
331 ("\\($(5!7!h!6!h!O(B\\)" "$(5$4(B" sanskrit) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
332 ("\\($(5!7!h!3!h!M(B\\)" "$(5$5(B" sanskrit) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
333 ("\\($(5!7!h!4!h!M(B\\)" "$(5$6(B" sanskrit) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
334 ("\\($(5!7!h!5!h!M(B\\)" "$(5$7(B" sanskrit) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
335 ("\\($(5!7!h!6!h!M(B\\)" "$(5$8(B" sanskrit) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
336 ("\\($(5!7!h!3(B\\)" "$(5$9(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
337 ("\\($(5!7!h!4(B\\)" "$(5$:(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
338 ("\\($(5!7!h!5!h!O(B\\)" "$(5$;"q(B") ; Special Rule. May be precomposed font needed. |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
339 ("\\($(5!7!h!5(B\\)" "$(5$;(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
340 ("\\($(5!7!h!6(B\\)" "$(5$<(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
341 ("\\($(5!7!h!7(B\\)" "$(5$=(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
342 ("\\($(5!7!h!F(B\\)" "$(5$>(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
343 ("\\($(5!7!h!L(B\\)" "$(5$?(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
344 ("\\($(5!7!h!M(B\\)" "$(5$@(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
345 ("\\($(5!8!h(B\\)[$(5!8!<(B]$(5!h(B" "$(5"8(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
346 ("\\($(5!8!h!8(B\\)" "$(5$A(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
347 ("\\($(5!8!h!<(B\\)" "$(5$B(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
348 ("\\($(5!8!h!O!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"8"q(B") ; Half Form Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
349 ("\\($(5!8!h!O(B\\)" "$(5!8"q(B") ; Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
350 ("\\($(5!8!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"8(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
351 ("\\($(5!9!h!M(B\\)" "$(5$C(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
352 ("\\($(5!:!h!O(B\\)" "$(5$D(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
353 ("\\($(5!:!h!<!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"m(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
354 ("\\($(5!:!h!<(B\\)" "$(5$E(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
355 ("\\($(5!:!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5":(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
356 ("\\($(5!:!i!h!O(B\\)" "$(5"!(B") ; Nukta Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
357 ("\\($(5!:!i!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"z(B") ; Nukta Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
358 ("\\($(5!:!i(B\\)" "$(5#:(B") ; Nukta |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
359 ("\\($(5!;!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5";(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
360 ("\\($(5!<!h(B\\)$(5!8!h(B[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"<(B") ; Special Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
361 ("\\($(5!<!h!8(B\\)" "$(5$F(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
362 ("\\($(5!<!h(B\\)$(5!:!h(B[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"<(B") ; Special Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
363 ("\\($(5!<!h!:(B\\)" "$(5$G(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
364 ("\\($(5!<!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"<(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
365 ("\\($(5!=!h!3(B\\)" "$(5$H(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
366 ("\\($(5!=!h!=(B\\)" "$(5$I(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
367 ("\\($(5!=!h!>(B\\)" "$(5$J(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
368 ("\\($(5!=!h!M(B\\)" "$(5$K(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
369 ("\\($(5!>!h!M(B\\)" "$(5$L(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
370 ("\\($(5!?!h!5!h!M(B\\)" "$(5$M(B" sanskrit) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
371 ("\\($(5!?!h!6!h!O(B\\)" "$(5$N(B" sanskrit) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
372 ("\\($(5!?!h!O!h!M(B\\)" "$(5$O(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
373 ("\\($(5!?!h!5(B\\)" "$(5$P(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
374 ("\\($(5!?!h!6(B\\)" "$(5$Q(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
375 ("\\($(5!?!h!?(B\\)" "$(5$R(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
376 ("\\($(5!?!h!L(B\\)" "$(5$S(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
377 ("\\($(5!?!h!M(B\\)" "$(5$T(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
378 ("\\($(5!?!i(B\\)" "$(5#?(B") ; Nukta |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
379 ("\\($(5!@!h!M(B\\)" "$(5$`(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
380 ("\\($(5!@!i(B\\)" "$(5#@(B") ; Nukta |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
381 ("\\($(5!A!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"A(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
382 ("\\($(5!B!h(B\\)$(5!B!h!O(B" "$(5"B(B") ; Special Rule for "t-tr" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
383 ("\\($(5!B!h!B!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"c(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
384 ("\\($(5!B!h!B(B\\)" "$(5$a(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
385 ("\\($(5!B!h!F(B\\)" "$(5$b(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
386 ("\\($(5!B!h!O!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"d(B") ; Half Form Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
387 ("\\($(5!B!h!O(B\\)" "$(5"%(B") ; Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
388 ("\\($(5!B!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"B(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
389 ("\\($(5!C!h!O(B\\)" "$(5!C"q(B") ; Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
390 ("\\($(5!C!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"C(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
391 ("\\($(5!D!h!D!h!M(B\\)" "$(5$c(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
392 ("\\($(5!D!h!E!h!M(B\\)" "$(5$d(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
393 ("\\($(5!D!h!K!h!M(B\\)" "$(5$e(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
394 ("\\($(5!D!h!K!h!O(B\\)" "$(5$r"r(B") ; Special Case for "dbhr" ; *** |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
395 ("\\($(5!D!h!O!h!M(B\\)" "$(5$f(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
396 ("\\($(5!D!h!T!h!M(B\\)" "$(5$g(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
397 ("\\($(5!D!h!5!h!O(B\\)" "$(5$h(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
398 ("\\($(5!D!h!6!h!O(B\\)" "$(5$i(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
399 ("\\($(5!D!h!D!h!T(B\\)" "$(5$j(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
400 ("\\($(5!D!h!E!h!T(B\\)" "$(5$k(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
401 ("\\($(5!D!h(B\\)$(5!E!h(B[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5!D!h(B") ; Special Half Form (for ddhra) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
402 ("\\($(5!D!h!5(B\\)" "$(5$l(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
403 ("\\($(5!D!h!6(B\\)" "$(5$m(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
404 ("\\($(5!D!h!D(B\\)" "$(5$n(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
405 ("\\($(5!D!h!E(B\\)" "$(5$o(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
406 ("\\($(5!D!h!F(B\\)" "$(5$p(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
407 ("\\($(5!D!h(B\\)$(5!J!h(B" "$(5!D!h(B") ; Suppressing "db-" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
408 ("\\($(5!D!h!J(B\\)" "$(5$q(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
409 ("\\($(5!D!h!K(B\\)" "$(5$r(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
410 ("\\($(5!D!h!L(B\\)" "$(5$s(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
411 ("\\($(5!D!h!M(B\\)" "$(5$t(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
412 ("\\($(5!D!h!T(B\\)" "$(5$u(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
413 ("\\($(5!E!h!F!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"e(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
414 ("\\($(5!E!h!F(B\\)" "$(5$v(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
415 ("\\($(5!E!h!O!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"f(B") ; Half Form Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
416 ("\\($(5!E!h!O(B\\)" "$(5!E"q(B") ; Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
417 ("\\($(5!E!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"E(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
418 ("\\($(5!F!h!F!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"k(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
419 ("\\($(5!F!h!F(B\\)" "$(5$w(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
420 ("\\($(5!F!h!O(B\\)" "$(5!F"q(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
421 ("\\($(5!F!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"F(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
422 ("\\($(5!G!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"G(B") ; Nukta Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
423 ("\\($(5!H!h(B\\)$(5!B!h!O(B" "$(5"H(B") ; Special Rule for "p-tr" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
424 ("\\($(5!H!h!B!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"g(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
425 ("\\($(5!H!h!B(B\\)" "$(5$x(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
426 ("\\($(5!H!h!F(B\\)" "$(5$y(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
427 ("\\($(5!H!h!Q(B\\)" "$(5$z(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
428 ("\\($(5!H!h!O(B\\)" "$(5"&(B") ; Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
429 ("\\($(5!H!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"H(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
430 ("\\($(5!I!h!O(B\\)" "$(5"'(B") ; Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
431 ("\\($(5!I!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"I(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
432 ("\\($(5!I!i!h!O(B\\)" "$(5""(B") ; Nukta Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
433 ("\\($(5!I!i!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"y(B") ; Nukta Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
434 ("\\($(5!I!i(B\\)" "$(5#I(B") ; Nukta |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
435 ("\\($(5!J!h(B\\)$(5!F!h(B[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"J(B") ; Special Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
436 ("\\($(5!J!h!F(B\\)" "$(5${(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
437 ("\\($(5!J!h(B\\)$(5!J!h(B[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"J(B") ; Special Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
438 ("\\($(5!J!h!J(B\\)" "$(5$|(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
439 ("\\($(5!J!h(B\\)$(5!T!h(B[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"J(B") ; Special Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
440 ("\\($(5!J!h!T(B\\)" "$(5$}(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
441 ("\\($(5!J!h!O(B\\)" "$(5!J"q(B") ; Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
442 ("\\($(5!J!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"J(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
443 ("\\($(5!K!h!F(B\\)" "$(5$~(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
444 ("\\($(5!K!h!O(B\\)" "$(5!K"q(B") ; Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
445 ("\\($(5!K!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"K(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
446 ("\\($(5!L!h!F(B\\)" "$(5#P(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
447 ("\\($(5!L!h!Q(B\\)" "$(5#Q(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
448 ("\\($(5!L!h!O(B\\)" "$(5!L"q(B") ; Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
449 ("\\($(5!L!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"L(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
450 ("\\($(5!M!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"M(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
451 ("\\($(5!N!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"N(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
452 ;; special form for "ru". |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
453 ("\\($(5!O!](B\\)" "$(5",(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
454 ("\\($(5!O!^(B\\)" "$(5"-(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
455 ("\\($(5!P!](B\\)" "$(5".(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
456 ("\\($(5!P!^(B\\)" "$(5"/(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
457 ;; |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
458 ("\\($(5!Q!h!Q(B\\)" "$(5#`(B" sanskrit) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
459 ("\\($(5!Q!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"Q(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
460 ("\\($(5!R!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"R(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
461 ("\\($(5!S!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"S(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
462 ("\\($(5!T!h!F(B\\)" "$(5#a(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
463 ("\\($(5!T!h!T(B\\)" "$(5#b(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
464 ("\\($(5!T!h!O(B\\)" "$(5!T"q(B") ; Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
465 ("\\($(5!T!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"T(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
466 ("\\($(5!U!h!8!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"h(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
467 ("\\($(5!U!h!8(B\\)" "$(5#c(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
468 ("\\($(5!U!h!F(B\\)" "$(5#d(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
469 ("\\($(5!U!h!J(B\\)" "$(5#e(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
470 ("\\($(5!U!h!Q(B\\)" "$(5#f(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
471 ("\\($(5!U!h(B\\)$(5!T!h!O(B" "$(5"U(B") ; Special Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
472 ("\\($(5!U!h!T!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"j(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
473 ; ("\\($(5!U!h!T(B\\)" "$(5#g(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
474 ("\\($(5!U!h!O!h!T(B\\)" "$(5#g(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
475 ("\\($(5!U!h!O!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"i(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
476 ("\\($(5!U!h!O(B\\)" "$(5")(B") ; Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
477 ("\\($(5!U!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"U(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
478 ("\\($(5!V!h!=!h!O!h!M(B\\)" "$(5#h(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
479 ("\\($(5!V!h!=!h!M(B\\)" "$(5#i(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
480 ("\\($(5!V!h!=!h!T(B\\)" "$(5#j(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
481 ("\\($(5!V!h!=(B\\)" "$(5#k(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
482 ("\\($(5!V!h!>(B\\)" "$(5#l(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
483 ("\\($(5!V!h!O(B\\)" "$(5!V"q(B") ; Post "r" |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
484 ("\\($(5!V!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"V(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
485 ("\\($(5!W!h!F!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"W"F(B") ; Special Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
486 ("\\($(5!W!h!F(B\\)" "$(5#m(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
487 ("\\($(5!W!h!O(B\\)" "$(5#n(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
488 ("\\($(5!W!h(B\\)[$(5!3(B-$(5!N!P(B-$(5!X(B]" "$(5"W(B") ; Half Form |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
489 ("\\($(5!X!h!A(B\\)" "$(5#p(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
490 ("\\($(5!X!h!F(B\\)" "$(5#q(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
491 ("\\($(5!X!h!L(B\\)" "$(5#r(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
492 ("\\($(5!X!h!M(B\\)" "$(5#s(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
493 ("\\($(5!X!h!O(B\\)" "$(5#t(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
494 ("\\($(5!X!h!Q(B\\)" "$(5#u(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
495 ("\\($(5!X!h!T(B\\)" "$(5#v(B") |
17052 | 496 ;; Special Ligature Rules |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
497 ("\\($(5!X!_(B\\)" "$(5#R(B") |
17052 | 498 |
499 ;; For consonants other than listed above, glyph-composition will | |
500 ;; be applied. If the consonant which is preceding "$(5!O(B" does not | |
501 ;; have the vertical line (such as "$(5!?(B"), "$(5"r(B" is put beneath the | |
502 ;; consonant. | |
503 ;; | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
504 ("[$(5!7!9!=!>!?!@!D!O!P!R!S!X(B]\\($(5!h!O(B\\)" "$(5"r(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
505 ("[$(5!6!8!C!E!F!H!J!K!L!M!T!V(B]\\($(5!h!O(B\\)" "$(5"q(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
506 ("$(5!?!i(B\\($(5!h!O(B\\)" "$(5"r(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
507 ("$(5!@!i(B\\($(5!h!O(B\\)" "$(5"r(B") |
17052 | 508 |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
509 ;; Nukta with Non-Consonants |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
510 ("\\($(5!!!i(B\\)" "$(5#!(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
511 ("\\($(5!&!i(B\\)" "$(5#&(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
512 ("\\($(5!'!i(B\\)" "$(5#'(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
513 ("\\($(5!*!i(B\\)" "$(5#*(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
514 ("\\($(5![!i(B\\)" "$(5#L(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
515 ("\\($(5!\!i(B\\)" "$(5#M(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
516 ("\\($(5!_!i(B\\)" "$(5#K(B") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
517 ("\\($(5!j!i(B\\)" "$(5#J(B") |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
518 |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
519 ;; Special rule for "r + some vowels" |
22520
901451c61b3f
(devanagari-digit-viram-visarga): Set the
Kenichi Handa <handa@m17n.org>
parents:
21442
diff
changeset
|
520 ("\\($(5!O!_!i(B\\)" "$(5#*"p(B") |
901451c61b3f
(devanagari-digit-viram-visarga): Set the
Kenichi Handa <handa@m17n.org>
parents:
21442
diff
changeset
|
521 ("\\($(5!O![!i(B\\)" "$(5#&"p(B") |
901451c61b3f
(devanagari-digit-viram-visarga): Set the
Kenichi Handa <handa@m17n.org>
parents:
21442
diff
changeset
|
522 ("\\($(5!O!\!i(B\\)" "$(5#'"p(B") |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
523 ("\\($(5!O!_(B\\)" "$(5!*"p(B") |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
524 ;; If everything fails, "y" will connect to the front consonant. |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
525 ("\\($(5!h!M(B\\)" "$(5"](B") |
17052 | 526 ) |
527 "Alist of regexps of Devanagari character sequences vs composed characters.") | |
528 | |
529 (let ((rules devanagari-char-to-glyph-rules)) | |
530 (while rules | |
531 (let ((rule (car rules)) | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
532 (chars) (char) (glyphs) (glyph)) |
17052 | 533 (setq rules (cdr rules)) |
534 (string-match "\\\\(\\(.+\\)\\\\)" (car rule)) | |
535 (setq chars (substring (car rule) (match-beginning 1) (match-end 1))) | |
536 (setq char (string-to-char chars)) | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
537 (setq glyphs (cdr rule)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
538 (setq glyph (string-to-char (car glyphs))) |
17052 | 539 (put-char-code-property |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
540 char 'char-to-glyph |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
541 ;; We don't "cons" it since priority is top to down. |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
542 (append (get-char-code-property char 'char-to-glyph) (list rule))) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
543 |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
544 (if (and (< ?(5z(B glyph) ; Glyphs only. |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
545 (null (get-char-code-property glyph 'glyph-to-char))) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
546 ; One glyph may corresponds to multiple characters, |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
547 ; e.g., surrounding vowel in Tamil, etc. |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
548 ; but for Devanagari, we put this restriction |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
549 ; to make sure the fact that one glyph corresponds to one char. |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
550 (put-char-code-property |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
551 glyph 'glyph-to-char |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
552 (cons (list (car glyphs) chars) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
553 (get-char-code-property glyph 'glyph-to-char) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
554 )))))) |
17052 | 555 |
556 ;; | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
557 ;; Function used in both characters-to-glyphs conversion and |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
558 ;; glyphs-to-characters conversion. |
17052 | 559 ;; |
560 | |
26894 | 561 (defun max-match-len (regexp) |
562 "Return the maximum length of text that can match the pattern REGEXP. | |
563 Only [...] pattern of regexp is recognized." | |
564 (let ((len 0) | |
565 (index 0)) | |
566 (while (string-match "\\[\\([^\]]\\)+\\]" regexp index) | |
567 (setq len (+ len (- (match-beginning 0) index) 1) | |
568 index (match-end 0))) | |
569 len)) | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
570 |
26894 | 571 ;; Return t iff at least one member appears in both LIST1 and LIST2. |
572 (defun intersecting-p (list1 list2) | |
20839 | 573 (let ((found nil)) |
574 (while (and list1 (not found)) | |
575 (if (memq (car list1) list2) | |
576 (setq found t) | |
577 (setq list1 (cdr list1)))) | |
578 found)) | |
579 | |
26894 | 580 (defun string-conversion-by-rule (source symbol &rest specs) |
581 "Convert string SOURCE by rules stored in SYMBOL property of each character. | |
582 The remaining arguments forms a list SPECS that restricts applicable rules. | |
583 | |
584 The rules has the form ((REGEXP STR RULE-SPEC ...) ...). | |
585 Each character sequence in STRING that matches REGEXP is | |
586 replaced by STR. | |
587 | |
588 If SPECS is nil, only rules with no RULE-SPECs is applied. Otherwise | |
589 rules with no RULE-SPECS and rules that have at least one member of | |
590 SPECS in RULE-SPECs is applied. | |
591 | |
592 Rules are tested in the order of the list, thus more specific rules | |
593 should be placed in front of less specific rules. | |
594 | |
595 If rule is given in the forms of regexp '...\\(...\\)...', a character | |
596 sequence that matches the pattern inside of the parenthesis is the | |
597 subject of the match. Otherwise, the entire expression is the subject | |
598 of the match." | |
17052 | 599 (let ((pos 0) |
600 (dst-str "")) | |
26894 | 601 (while (< pos (length source)) |
17052 | 602 (let ((found nil) |
603 (rules (get-char-code-property | |
604 (string-to-char | |
26894 | 605 (substring source pos)) symbol))) |
17052 | 606 (while rules |
607 (let* ((rule (car rules)) | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
608 (regexp (car rule)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
609 (replace-str (car (cdr rule))) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
610 (rule-specs (cdr (cdr rule))) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
611 search-pos) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
612 (if (not (or (null rule-specs) |
26894 | 613 (intersecting-p specs rule-specs))) |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
614 (setq rules (cdr rules)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
615 (if (null (string-match "\\\\(.+\\\\)" regexp)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
616 (progn |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
617 (setq regexp (concat "\\(" regexp "\\)")) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
618 (setq search-pos pos)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
619 (setq search-pos (- pos (max-match-len |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
620 (substring regexp |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
621 (string-match "^[^\\\\]*" regexp) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
622 (match-end 0)))))) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
623 (if (< search-pos 0) (setq search-pos 0)) |
26894 | 624 (if (string-match regexp source search-pos) |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
625 (if (= (match-beginning 1) pos) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
626 (progn |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
627 (setq dst-str (concat dst-str replace-str)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
628 (setq rules nil) ; Get out of the loop. |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
629 (setq found t) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
630 ;; proceed `pos' for replaced characters. |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
631 (setq pos (match-end 1))) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
632 (setq rules (cdr rules))) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
633 (setq rules (cdr rules)))))) |
17052 | 634 ;; proceed to next position |
635 (if (not found) | |
26894 | 636 (setq dst-str (concat dst-str (substring source pos (1+ pos))) |
20839 | 637 pos (1+ pos))))) |
17052 | 638 dst-str)) |
639 | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
640 |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
641 ;; |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
642 ;; Convert Character Code to Glyph Code |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
643 ;; |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
644 |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
645 ;;;###autoload |
26894 | 646 (defun char-to-glyph-devanagari (string &rest langs) |
647 "Convert Devanagari characters in STRING to Devanagari glyphs. | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
648 Ligatures and special rules are processed." |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
649 (apply |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
650 'string-conversion-by-rule |
26894 | 651 (append (list string 'char-to-glyph) langs))) |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
652 |
17052 | 653 ;; Example: |
654 ;;(char-to-glyph-devanagari "$(5!X![!F!h!D!\(B") => "$(5!X!["F!D!\(B" | |
655 ;;(char-to-glyph-devanagari "$(5!O!Z!V!h!=!h!O![!M(B") => ??? | |
656 | |
657 ;; | |
658 ;; Phase 2: Compose Glyphs to form One Glyph. | |
659 ;; | |
660 | |
26894 | 661 ;; Each list consists of glyph, application-priority and application-direction. |
17052 | 662 ;; |
663 ;; Glyphs will be ordered from low priority number to high priority number. | |
664 ;; If application-priority is omitted, it is assumed to be 0. | |
665 ;; If application-direction is omitted, it is asumbed to be '(mr . ml). | |
666 | |
667 (defconst devanagari-composition-rules | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
668 '((?$(5!!(B 0 (tr . br)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
669 (?$(5!"(B 0 (mr . mr)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
670 (?$(5!#(B 0) |
17052 | 671 (?$(5!$(B 0) |
672 (?$(5!%(B 0) | |
673 (?$(5!&(B 0) | |
674 (?$(5!'(B 0) | |
675 (?$(5!((B 0) | |
676 (?$(5!)(B 0) | |
677 (?$(5!*(B 0) | |
678 (?$(5!+(B 0) | |
679 (?$(5!,(B 0) | |
680 (?$(5!-(B 0) | |
681 (?$(5!.(B 0) | |
682 (?$(5!/(B 0) | |
683 (?$(5!0(B 0) | |
684 (?$(5!1(B 0) | |
685 (?$(5!2(B 0) | |
686 (?$(5!3(B 0) | |
687 (?$(5!4(B 0) | |
688 (?$(5!5(B 0) | |
689 (?$(5!6(B 0) | |
690 (?$(5!7(B 0) | |
691 (?$(5!8(B 0) | |
692 (?$(5!9(B 0) | |
693 (?$(5!:(B 0) | |
694 (?$(5!;(B 0) | |
695 (?$(5!<(B 0) | |
696 (?$(5!=(B 0) | |
697 (?$(5!>(B 0) | |
698 (?$(5!?(B 0) | |
699 (?$(5!@(B 0) | |
700 (?$(5!A(B 0) | |
701 (?$(5!B(B 0) | |
702 (?$(5!C(B 0) | |
703 (?$(5!D(B 0) | |
704 (?$(5!E(B 0) | |
705 (?$(5!F(B 0) | |
706 (?$(5!G(B 0) | |
707 (?$(5!H(B 0) | |
708 (?$(5!I(B 0) | |
709 (?$(5!J(B 0) | |
710 (?$(5!K(B 0) | |
711 (?$(5!L(B 0) | |
712 (?$(5!M(B 0) | |
713 (?$(5!N(B 0) | |
714 (?$(5!O(B 0) | |
715 (?$(5!P(B 0) | |
716 (?$(5!Q(B 0) | |
717 (?$(5!R(B 0) | |
718 (?$(5!S(B 0) | |
719 (?$(5!T(B 0) | |
720 (?$(5!U(B 0) | |
721 (?$(5!V(B 0) | |
722 (?$(5!W(B 0) | |
723 (?$(5!X(B 0) | |
724 (?$(5!Y(B 0) | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
725 (?$(5!Z(B 0) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
726 (?$(5![(B 0 (ml . mr)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
727 (?$(5!\(B 0) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
728 (?$(5!](B 0 (br . tr)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
729 (?$(5!^(B 0 (br . tr)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
730 (?$(5!_(B 0 (br . tr)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
731 (?$(5!`(B 0 (mr . mr)) ; (tc . bc) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
732 (?$(5!a(B 0 (mr . mr)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
733 (?$(5!b(B 0 (mr . mr)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
734 (?$(5!c(B 0 (mr . mr)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
735 (?$(5!d(B 0) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
736 (?$(5!e(B 0) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
737 (?$(5!f(B 0) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
738 (?$(5!g(B 0) |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
739 (?$(5!h(B 0 (br . tr)) |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
740 (?$(5!i(B 0 (br . tr)) |
17052 | 741 (?$(5!j(B 0) |
742 (nil 0) | |
743 (nil 0) | |
744 (nil 0) | |
745 (nil 0) | |
746 (nil 0) | |
747 (nil 0) | |
748 (?$(5!q(B 0) | |
749 (?$(5!r(B 0) | |
750 (?$(5!s(B 0) | |
751 (?$(5!t(B 0) | |
752 (?$(5!u(B 0) | |
753 (?$(5!v(B 0) | |
754 (?$(5!w(B 0) | |
755 (?$(5!x(B 0) | |
756 (?$(5!y(B 0) | |
757 (?$(5!z(B 0) | |
758 (nil 0) | |
759 (nil 0) | |
760 (nil 0) | |
761 (nil 0) | |
762 (?$(5"!(B 0) | |
763 (?$(5""(B 0) | |
764 (?$(5"#(B 0) | |
765 (?$(5"$(B 0) | |
766 (?$(5"%(B 0) | |
767 (?$(5"&(B 0) | |
768 (?$(5"'(B 0) | |
769 (?$(5"((B 0) | |
770 (?$(5")(B 0) | |
771 (?$(5"*(B 0) | |
772 (?$(5"+(B 0) | |
773 (?$(5",(B 0) | |
774 (?$(5"-(B 0) | |
775 (?$(5".(B 0) | |
776 (?$(5"/(B 0) | |
777 (?$(5"0(B 0) | |
778 (?$(5"1(B 0) | |
779 (?$(5"2(B 0) | |
780 (?$(5"3(B 0) | |
781 (?$(5"4(B 0) | |
782 (?$(5"5(B 0) | |
783 (?$(5"6(B 0) | |
784 (?$(5"7(B 0) | |
785 (?$(5"8(B 0) | |
786 (?$(5"9(B 0) | |
787 (?$(5":(B 0) | |
788 (?$(5";(B 0) | |
789 (?$(5"<(B 0) | |
790 (?$(5"=(B 0) | |
791 (?$(5">(B 0) | |
792 (?$(5"?(B 0) | |
793 (?$(5"@(B 0) | |
794 (?$(5"A(B 0) | |
795 (?$(5"B(B 0) | |
796 (?$(5"C(B 0) | |
797 (?$(5"D(B 0) | |
798 (?$(5"E(B 0) | |
799 (?$(5"F(B 0) | |
800 (?$(5"G(B 0) | |
801 (?$(5"H(B 0) | |
802 (?$(5"I(B 0) | |
803 (?$(5"J(B 0) | |
804 (?$(5"K(B 0) | |
805 (?$(5"L(B 0) | |
806 (?$(5"M(B 0) | |
807 (?$(5"N(B 0) | |
808 (?$(5"O(B 0) | |
809 (?$(5"P(B 0) | |
810 (?$(5"Q(B 0) | |
811 (?$(5"R(B 0) | |
812 (?$(5"S(B 0) | |
813 (?$(5"T(B 0) | |
814 (?$(5"U(B 0) | |
815 (?$(5"V(B 0) | |
816 (?$(5"W(B 0) | |
817 (?$(5"X(B 0) | |
818 (?$(5"Y(B 0) | |
819 (?$(5"Z(B 0) | |
820 (?$(5"[(B 0) | |
821 (?$(5"\(B 0) | |
822 (?$(5"](B 0) | |
823 (?$(5"^(B 0) | |
824 (?$(5"_(B 0) | |
825 (?$(5"`(B 0) | |
826 (?$(5"a(B 0) | |
827 (?$(5"b(B 0) | |
828 (?$(5"c(B 0) | |
829 (?$(5"d(B 0) | |
830 (?$(5"e(B 0) | |
831 (?$(5"f(B 0) | |
832 (?$(5"g(B 0) | |
833 (?$(5"h(B 0) | |
834 (?$(5"i(B 0) | |
835 (?$(5"j(B 0) | |
836 (?$(5"k(B 0) | |
837 (?$(5"l(B 0) | |
838 (?$(5"m(B 0) | |
839 (?$(5"n(B 0) | |
840 (?$(5"o(B 0) | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
841 (?$(5"p(B 10 (mr . mr)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
842 (?$(5"q(B 0 (br . br)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
843 (?$(5"r(B 0 (br . tr)) |
17052 | 844 (?$(5"s(B 0) |
845 (?$(5"t(B 0) | |
846 (?$(5"u(B 0) | |
847 (?$(5"v(B 0) | |
848 (?$(5"w(B 0) | |
849 (?$(5"x(B 0) | |
850 (?$(5"y(B 0) | |
851 (?$(5"z(B 0) | |
852 (?$(5"{(B 0) | |
853 (?$(5"|(B 0) | |
854 (?$(5"}(B 0) | |
855 (?$(5"~(B 0) | |
856 (?$(5#!(B 0) | |
857 (?$(5#"(B 0) | |
858 (?$(5##(B 0) | |
859 (?$(5#$(B 0) | |
860 (?$(5#%(B 0) | |
861 (?$(5#&(B 0) | |
862 (?$(5#'(B 0) | |
863 (?$(5#((B 0) | |
864 (?$(5#)(B 0) | |
865 (?$(5#*(B 0) | |
866 (?$(5#+(B 0) | |
867 (?$(5#,(B 0) | |
868 (?$(5#-(B 0) | |
869 (?$(5#.(B 0) | |
870 (?$(5#/(B 0) | |
871 (?$(5#0(B 0) | |
872 (?$(5#1(B 0) | |
873 (?$(5#2(B 0) | |
874 (?$(5#3(B 0) | |
875 (?$(5#4(B 0) | |
876 (?$(5#5(B 0) | |
877 (?$(5#6(B 0) | |
878 (?$(5#7(B 0) | |
879 (?$(5#8(B 0) | |
880 (?$(5#9(B 0) | |
881 (?$(5#:(B 0) | |
882 (?$(5#;(B 0) | |
883 (?$(5#<(B 0) | |
884 (?$(5#=(B 0) | |
885 (?$(5#>(B 0) | |
886 (?$(5#?(B 0) | |
887 (?$(5#@(B 0) | |
888 (?$(5#A(B 0) | |
889 (?$(5#B(B 0) | |
890 (?$(5#C(B 0) | |
891 (?$(5#D(B 0) | |
892 (?$(5#E(B 0) | |
893 (?$(5#F(B 0) | |
894 (?$(5#G(B 0) | |
895 (?$(5#H(B 0) | |
896 (?$(5#I(B 0) | |
897 (?$(5#J(B 0) | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
898 (?$(5#K(B 0 (br . tr)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
899 (?$(5#L(B 0 (br . tr)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
900 (?$(5#M(B 0 (br . tr)) |
17052 | 901 (?$(5#N(B 0) |
902 (?$(5#O(B 0) | |
903 (?$(5#P(B 0) | |
904 (?$(5#Q(B 0) | |
905 (?$(5#R(B 0) | |
906 (?$(5#S(B 0) | |
907 (?$(5#T(B 0) | |
908 (?$(5#U(B 0) | |
909 (?$(5#V(B 0) | |
910 (?$(5#W(B 0) | |
911 (?$(5#X(B 0) | |
912 (?$(5#Y(B 0) | |
913 (?$(5#Z(B 0) | |
914 (?$(5#[(B 0) | |
915 (?$(5#\(B 0) | |
916 (?$(5#](B 0) | |
917 (?$(5#^(B 0) | |
918 (?$(5#_(B 0) | |
919 (?$(5#`(B 0) | |
920 (?$(5#a(B 0) | |
921 (?$(5#b(B 0) | |
922 (?$(5#c(B 0) | |
923 (?$(5#d(B 0) | |
924 (?$(5#e(B 0) | |
925 (?$(5#f(B 0) | |
926 (?$(5#g(B 0) | |
927 (?$(5#h(B 0) | |
928 (?$(5#i(B 0) | |
929 (?$(5#j(B 0) | |
930 (?$(5#k(B 0) | |
931 (?$(5#l(B 0) | |
932 (?$(5#m(B 0) | |
933 (?$(5#n(B 0) | |
934 (?$(5#o(B 0) | |
935 (?$(5#p(B 0) | |
936 (?$(5#q(B 0) | |
937 (?$(5#r(B 0) | |
938 (?$(5#s(B 0) | |
939 (?$(5#t(B 0) | |
940 (?$(5#u(B 0) | |
941 (?$(5#v(B 0) | |
942 (?$(5#w(B 0) | |
943 (?$(5#x(B 0) | |
944 (?$(5#y(B 0) | |
945 (?$(5#z(B 0) | |
946 (?$(5#{(B 0) | |
947 (?$(5#|(B 0) | |
948 (?$(5#}(B 0) | |
949 (?$(5#~(B 0) | |
950 (?$(5$!(B 0) | |
951 (?$(5$"(B 0) | |
952 (?$(5$#(B 0) | |
953 (?$(5$$(B 0) | |
954 (?$(5$%(B 0) | |
955 (?$(5$&(B 0) | |
956 (?$(5$'(B 0) | |
957 (?$(5$((B 0) | |
958 (?$(5$)(B 0) | |
959 (?$(5$*(B 0) | |
960 (?$(5$+(B 0) | |
961 (?$(5$,(B 0) | |
962 (?$(5$-(B 0) | |
963 (?$(5$.(B 0) | |
964 (?$(5$/(B 0) | |
965 (?$(5$0(B 0) | |
966 (?$(5$1(B 0) | |
967 (?$(5$2(B 0) | |
968 (?$(5$3(B 0) | |
969 (?$(5$4(B 0) | |
970 (?$(5$5(B 0) | |
971 (?$(5$6(B 0) | |
972 (?$(5$7(B 0) | |
973 (?$(5$8(B 0) | |
974 (?$(5$9(B 0) | |
975 (?$(5$:(B 0) | |
976 (?$(5$;(B 0) | |
977 (?$(5$<(B 0) | |
978 (?$(5$=(B 0) | |
979 (?$(5$>(B 0) | |
980 (?$(5$?(B 0) | |
981 (?$(5$@(B 0) | |
982 (?$(5$A(B 0) | |
983 (?$(5$B(B 0) | |
984 (?$(5$C(B 0) | |
985 (?$(5$D(B 0) | |
986 (?$(5$E(B 0) | |
987 (?$(5$F(B 0) | |
988 (?$(5$G(B 0) | |
989 (?$(5$H(B 0) | |
990 (?$(5$I(B 0) | |
991 (?$(5$J(B 0) | |
992 (?$(5$K(B 0) | |
993 (?$(5$L(B 0) | |
994 (?$(5$M(B 0) | |
995 (?$(5$N(B 0) | |
996 (?$(5$O(B 0) | |
997 (?$(5$P(B 0) | |
998 (?$(5$Q(B 0) | |
999 (?$(5$R(B 0) | |
1000 (?$(5$S(B 0) | |
1001 (?$(5$T(B 0) | |
1002 (?$(5$U(B 0) | |
1003 (?$(5$V(B 0) | |
1004 (?$(5$W(B 0) | |
1005 (?$(5$X(B 0) | |
1006 (?$(5$Y(B 0) | |
1007 (?$(5$Z(B 0) | |
1008 (?$(5$[(B 0) | |
1009 (?$(5$\(B 0) | |
1010 (?$(5$](B 0) | |
1011 (?$(5$^(B 0) | |
1012 (?$(5$_(B 0) | |
1013 (?$(5$`(B 0) | |
1014 (?$(5$a(B 0) | |
1015 (?$(5$b(B 0) | |
1016 (?$(5$c(B 0) | |
1017 (?$(5$d(B 0) | |
1018 (?$(5$e(B 0) | |
1019 (?$(5$f(B 0) | |
1020 (?$(5$g(B 0) | |
1021 (?$(5$h(B 0) | |
1022 (?$(5$i(B 0) | |
1023 (?$(5$j(B 0) | |
1024 (?$(5$k(B 0) | |
1025 (?$(5$l(B 0) | |
1026 (?$(5$m(B 0) | |
1027 (?$(5$n(B 0) | |
1028 (?$(5$o(B 0) | |
1029 (?$(5$p(B 0) | |
1030 (?$(5$q(B 0) | |
1031 (?$(5$r(B 0) | |
1032 (?$(5$s(B 0) | |
1033 (?$(5$t(B 0) | |
1034 (?$(5$u(B 0) | |
1035 (?$(5$v(B 0) | |
1036 (?$(5$w(B 0) | |
1037 (?$(5$x(B 0) | |
1038 (?$(5$y(B 0) | |
1039 (?$(5$z(B 0) | |
1040 (?$(5${(B 0) | |
1041 (?$(5$|(B 0) | |
1042 (?$(5$}(B 0) | |
1043 (?$(5$~(B 0) | |
1044 )) | |
1045 | |
1046 ;; Determine composition priority and rule of the array of Glyphs. | |
1047 ;; Sort the glyphs with their priority. | |
1048 | |
26894 | 1049 (defun devanagari-reorder-glyphs-for-composition (string start end) |
1050 (let ((pos start) | |
1051 (ordered-glyphs nil)) | |
1052 (while (< pos end) | |
1053 (let ((glyph (aref string pos))) | |
17052 | 1054 (setq pos (1+ pos)) |
1055 (setq ordered-glyphs | |
26894 | 1056 (append ordered-glyphs |
1057 (list (assq glyph devanagari-composition-rules)))))) | |
17052 | 1058 (sort ordered-glyphs '(lambda (x y) (< (car (cdr x)) (car (cdr y))))))) |
1059 | |
26894 | 1060 ! ;;(devanagari-compose-to-one-glyph "$(5"5!X![(B") => "4$(6!Xv#"5t%![0!X"5![1(B" |
17052 | 1061 |
1062 (defun devanagari-compose-to-one-glyph (devanagari-string) | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1063 (let* ((o-glyph-list (devanagari-reorder-glyphs-for-composition |
26894 | 1064 devanagari-string 0 (length devanagari-string))) |
17052 | 1065 ;; List of glyphs to be composed. |
1066 (cmp-glyph-list (list (car (car o-glyph-list)))) | |
1067 (o-glyph-list (cdr o-glyph-list))) | |
1068 (while o-glyph-list | |
1069 (let* ((o-glyph (car o-glyph-list)) | |
1070 (glyph (if (< 2 (length o-glyph)) | |
1071 ;; default composition | |
1072 (list (car (cdr (cdr o-glyph))) (car o-glyph)) | |
1073 ;; composition with a specified rule | |
1074 (list '(mr . ml) (car o-glyph))))) | |
1075 (setq o-glyph-list (cdr o-glyph-list)) | |
1076 (setq cmp-glyph-list (append cmp-glyph-list glyph)))) | |
1077 ;; Before applying compose-chars, convert glyphs to | |
1078 ;; 1-column width if possible. | |
1079 (setq cmp-glyph-list (devanagari-wide-to-narrow cmp-glyph-list)) | |
1080 (if (= (length cmp-glyph-list) 1) (char-to-string (car cmp-glyph-list)) | |
1081 (apply 'compose-chars cmp-glyph-list)))) | |
1082 | |
26894 | 1083 (defun devanagari-composition-component (string &optional start end) |
1084 (or start (setq start 0)) | |
1085 (or end (setq end (length string))) | |
1086 (let* ((o-glyph-list (devanagari-reorder-glyphs-for-composition | |
1087 string start end)) | |
1088 ;; List of glyphs to be composed. | |
1089 (cmp-glyph-list (list (car (car o-glyph-list))))) | |
1090 (setq o-glyph-list (cdr o-glyph-list)) | |
1091 (while o-glyph-list | |
1092 (let* ((o-glyph (car o-glyph-list)) | |
1093 (glyph (if (< 2 (length o-glyph)) | |
1094 ;; default composition | |
1095 (list (car (cdr (cdr o-glyph))) (car o-glyph)) | |
1096 ;; composition with a specified rule | |
1097 (list '(mr . ml) (car o-glyph))))) | |
1098 (setq o-glyph-list (cdr o-glyph-list)) | |
1099 (setq cmp-glyph-list (append cmp-glyph-list glyph)))) | |
1100 ;; Convert glyphs to 1-column width if possible. | |
1101 (devanagari-wide-to-narrow cmp-glyph-list))) | |
1102 | |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1103 ;; Utility function for Phase 2.5 |
26894 | 1104 |
1105 ;; Check whether GLYPH is a Devanagari vertical modifier or not. | |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1106 ;; If it is a vertical modifier, whether it should be 1-column shape or not |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1107 ;; depends on previous non-vertical modifier. |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1108 (defun devanagari-vertical-modifier-p (glyph) |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1109 (string-match (char-to-string glyph) |
21442 | 1110 "[$(5!"!]!^!_!`!a!b!c!h!i"p"q"r#K#L#M(B]")) |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1111 |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1112 (defun devanagari-non-vertical-modifier-p (glyph) |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1113 (string-match (char-to-string glyph) |
21442 | 1114 ; "[$(5!Z![!\!d!e!f!g(B]")) |
1115 "[$(5![(B]")) | |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1116 |
21442 | 1117 (defun devanagari-wide-to-narrow-char (char) |
26894 | 1118 "Convert Devanagari character CHAR to the corresponding narrow character. |
1119 If there's no corresponding narrow character, return CHAR as is." | |
21442 | 1120 (let ((narrow (cdr (assq char devanagari-1-column-char)))) |
26894 | 1121 (or narrow char))) |
17052 | 1122 |
1123 ;; | |
26894 | 1124 ;; Phase 2.5 Convert appropriate character to 1-column shape. |
17052 | 1125 ;; |
1126 ;; This is temporary and should be removed out when Emacs supports | |
1127 ;; variable width characters. | |
1128 ;; | |
1129 ;; This will convert the composing glyphs (2 column glyphs) | |
1130 ;; to narrow (1 column) glyphs if they exist. | |
1131 ;; | |
1132 ;; devanagari-wide-to-narrow-old converts glyphs simply. | |
1133 ;; devanagari-wide-to-narrow takes care of upper/lower apply-glyphs | |
1134 ;; with 2 column base-glyph. | |
1135 ;; | |
1136 ;; Execution Examples | |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1137 ;;(devanagari-wide-to-narrow '(?$(5!3(B (ml . ml) ?$(5!a(B)) |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1138 ;;(devanagari-wide-to-narrow '(?$(5!F(B (ml . ml) ?$(5!a(B)) |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1139 |
17052 | 1140 (defun devanagari-wide-to-narrow (src-list) |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1141 (devanagari-wide-to-narrow-iter src-list t)) |
17052 | 1142 |
21442 | 1143 (defun devanagari-wide-to-narrow-iter (src-list 2-col-glyph) |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1144 (let ((glyph (car src-list))) |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1145 (cond ((null src-list) '()) |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1146 ; not glyph code |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1147 ((not (numberp glyph)) |
26894 | 1148 (cons glyph |
1149 (devanagari-wide-to-narrow-iter (cdr src-list) 2-col-glyph))) | |
21442 | 1150 ; glyphs to be processed regardless of the value of "2-col-glyph" |
1151 ((devanagari-non-vertical-modifier-p glyph) | |
1152 (cons (devanagari-wide-to-narrow-char glyph) | |
1153 (devanagari-wide-to-narrow-iter (cdr src-list) 2-col-glyph))) | |
1154 ; glyphs which are depends on the value of "2-col-glyph" | |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1155 ((devanagari-vertical-modifier-p glyph) |
21442 | 1156 (if 2-col-glyph |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1157 (cons glyph |
21442 | 1158 (devanagari-wide-to-narrow-iter (cdr src-list) t)) |
1159 (cons (devanagari-wide-to-narrow-char glyph) | |
26894 | 1160 (devanagari-wide-to-narrow-iter (cdr src-list) |
1161 2-col-glyph)))) | |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1162 ; normal glyph |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1163 (t |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1164 (if (cdr (assq glyph devanagari-1-column-char)) |
21442 | 1165 (cons (devanagari-wide-to-narrow-char glyph) |
17087
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1166 (devanagari-wide-to-narrow-iter (cdr src-list) nil)) |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1167 (cons glyph |
fb13faeea9aa
Fix handling of several characters.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
1168 (devanagari-wide-to-narrow-iter (cdr src-list) t))))))) |
17052 | 1169 |
1170 | |
1171 ;; | |
1172 ;; Summary | |
1173 ;; | |
1174 | |
1175 ;; | |
26894 | 1176 ;; Decomposition of composite sequence. |
17052 | 1177 ;; |
1178 | |
1179 ;;;###autoload | |
1180 (defun devanagari-decompose-string (str) | |
26894 | 1181 "Decompose Devanagari string STR" |
1182 (decompose-string (copy-sequence str))) | |
17052 | 1183 |
1184 ;;;###autoload | |
1185 (defun devanagari-decompose-region (from to) | |
1186 (interactive "r") | |
26894 | 1187 (decompose-region from to)) |
17052 | 1188 |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1189 ;;; |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1190 ;;; Composition |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1191 ;;; |
17052 | 1192 |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1193 ;;;###autoload |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1194 (defun devanagari-compose-string (str &rest langs) |
26894 | 1195 (setq str (copy-sequence str)) |
1196 (let ((idx 0) | |
1197 rest match-b match-e) | |
1198 (while (string-match devanagari-composite-glyph-unit str idx) | |
1199 (let* ((match-b (match-beginning 0)) | |
1200 (match-e (match-end 0)) | |
1201 (cmps (devanagari-composition-component | |
1202 (apply | |
1203 'char-to-glyph-devanagari | |
1204 (cons (substring str match-b match-e) langs))))) | |
1205 (compose-string str match-b match-e cmps) | |
1206 (setq idx match-e)))) | |
1207 str) | |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1208 |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1209 ;;;###autoload |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1210 (defun devanagari-compose-region (from to &rest langs) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1211 (interactive "r") |
26894 | 1212 (save-excursion |
1213 (save-restriction | |
1214 (narrow-to-region from to) | |
1215 (goto-char (point-min)) | |
1216 (while (re-search-forward devanagari-composite-glyph-unit nil t) | |
1217 (let* ((match-b (match-beginning 0)) (match-e (match-end 0)) | |
1218 (cmps (devanagari-composition-component | |
1219 (apply | |
1220 'char-to-glyph-devanagari | |
1221 (cons (buffer-substring match-b match-e) langs))))) | |
1222 (compose-region match-b match-e cmps)))))) | |
17052 | 1223 |
1224 ;; For pre-write and post-read conversion | |
1225 | |
1226 ;;;###autoload | |
1227 (defun devanagari-compose-from-is13194-region (from to) | |
1228 "Compose IS 13194 characters in the region to Devanagari characters." | |
1229 (interactive "r") | |
20111
761a83f7cb4e
(devanagari-compose-from-is13194-region):
Kenichi Handa <handa@m17n.org>
parents:
18547
diff
changeset
|
1230 (save-excursion |
761a83f7cb4e
(devanagari-compose-from-is13194-region):
Kenichi Handa <handa@m17n.org>
parents:
18547
diff
changeset
|
1231 (save-restriction |
761a83f7cb4e
(devanagari-compose-from-is13194-region):
Kenichi Handa <handa@m17n.org>
parents:
18547
diff
changeset
|
1232 (narrow-to-region from to) |
761a83f7cb4e
(devanagari-compose-from-is13194-region):
Kenichi Handa <handa@m17n.org>
parents:
18547
diff
changeset
|
1233 (indian-to-devanagari-region (point-min) (point-max)) |
761a83f7cb4e
(devanagari-compose-from-is13194-region):
Kenichi Handa <handa@m17n.org>
parents:
18547
diff
changeset
|
1234 (devanagari-compose-region (point-min) (point-max)) |
761a83f7cb4e
(devanagari-compose-from-is13194-region):
Kenichi Handa <handa@m17n.org>
parents:
18547
diff
changeset
|
1235 (- (point-max) (point-min))))) |
17052 | 1236 |
1237 ;;;###autoload | |
17773
f1ece95d00c2
(in-is13194-devanagari-post-read-conversion): New function.
Kenichi Handa <handa@m17n.org>
parents:
17314
diff
changeset
|
1238 (defun in-is13194-devanagari-post-read-conversion (len) |
26894 | 1239 (let ((pos (point))) |
1240 (devanagari-compose-from-is13194-region pos (+ pos len)))) | |
17773
f1ece95d00c2
(in-is13194-devanagari-post-read-conversion): New function.
Kenichi Handa <handa@m17n.org>
parents:
17314
diff
changeset
|
1241 |
f1ece95d00c2
(in-is13194-devanagari-post-read-conversion): New function.
Kenichi Handa <handa@m17n.org>
parents:
17314
diff
changeset
|
1242 ;;;###autoload |
17052 | 1243 (defun devanagari-decompose-to-is13194-region (from to) |
1244 "Decompose Devanagari characters in the region to IS 13194 characters." | |
1245 (interactive "r") | |
26894 | 1246 (save-excursion |
1247 (save-restriction | |
1248 (narrow-to-region from to) | |
1249 (devanagari-decompose-region (point-min) (point-max)) | |
1250 (devanagari-to-indian-region (point-min) (point-max))))) | |
17052 | 1251 |
17773
f1ece95d00c2
(in-is13194-devanagari-post-read-conversion): New function.
Kenichi Handa <handa@m17n.org>
parents:
17314
diff
changeset
|
1252 ;;;###autoload |
f1ece95d00c2
(in-is13194-devanagari-post-read-conversion): New function.
Kenichi Handa <handa@m17n.org>
parents:
17314
diff
changeset
|
1253 (defun in-is13194-devanagari-pre-write-conversion (from to) |
23525
7462da3c79cb
(in-is13194-devanagari-pre-write-conversion): Use with-temp-buffer.
Kenichi Handa <handa@m17n.org>
parents:
22987
diff
changeset
|
1254 (let ((old-buf (current-buffer))) |
23548
87736ae8e5ff
(in-is13194-devanagari-pre-write-conversion): Cancel previous
Kenichi Handa <handa@m17n.org>
parents:
23525
diff
changeset
|
1255 (set-buffer (generate-new-buffer " *temp*")) |
87736ae8e5ff
(in-is13194-devanagari-pre-write-conversion): Cancel previous
Kenichi Handa <handa@m17n.org>
parents:
23525
diff
changeset
|
1256 (if (stringp from) |
87736ae8e5ff
(in-is13194-devanagari-pre-write-conversion): Cancel previous
Kenichi Handa <handa@m17n.org>
parents:
23525
diff
changeset
|
1257 (insert from) |
87736ae8e5ff
(in-is13194-devanagari-pre-write-conversion): Cancel previous
Kenichi Handa <handa@m17n.org>
parents:
23525
diff
changeset
|
1258 (insert-buffer-substring old-buf from to)) |
87736ae8e5ff
(in-is13194-devanagari-pre-write-conversion): Cancel previous
Kenichi Handa <handa@m17n.org>
parents:
23525
diff
changeset
|
1259 (devanagari-decompose-to-is13194-region (point-min) (point-max)) |
17773
f1ece95d00c2
(in-is13194-devanagari-post-read-conversion): New function.
Kenichi Handa <handa@m17n.org>
parents:
17314
diff
changeset
|
1260 ;; Should return nil as annotations. |
f1ece95d00c2
(in-is13194-devanagari-post-read-conversion): New function.
Kenichi Handa <handa@m17n.org>
parents:
17314
diff
changeset
|
1261 nil)) |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1262 |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1263 ;; For input/output of ITRANS |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1264 |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1265 ;;;###autoload |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1266 (defun devanagari-encode-itrans-region (from to) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1267 (interactive "r") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1268 (save-restriction |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1269 (narrow-to-region from to) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1270 (devanagari-decompose-to-is13194-region (point-min) (point-max)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1271 (indian-encode-itrans-region (point-min) (point-max)))) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1272 |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1273 ;;;###autoload |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1274 (defun devanagari-decode-itrans-region (from to) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1275 (interactive "r") |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1276 (save-restriction |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1277 (narrow-to-region from to) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1278 (indian-decode-itrans-region (point-min) (point-max)) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1279 (devanagari-compose-from-is13194-region (point-min) (point-max)))) |
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1280 |
17052 | 1281 ;; |
18309
bd8b521f5218
Provide XXX-util instead of
Kenichi Handa <handa@m17n.org>
parents:
18203
diff
changeset
|
1282 (provide 'devan-util) |
17052 | 1283 |
17300
01d528c5dd18
Handle more Devanagari characters correctly.
Kenichi Handa <handa@m17n.org>
parents:
17087
diff
changeset
|
1284 ;;; devan-util.el end here |
36680
0c75fe9804e2
Add coding: tag in Local Variables: section.
Kenichi Handa <handa@m17n.org>
parents:
31446
diff
changeset
|
1285 |
0c75fe9804e2
Add coding: tag in Local Variables: section.
Kenichi Handa <handa@m17n.org>
parents:
31446
diff
changeset
|
1286 ;; Local Variables: |
0c75fe9804e2
Add coding: tag in Local Variables: section.
Kenichi Handa <handa@m17n.org>
parents:
31446
diff
changeset
|
1287 ;; coding: iso-2022-7bit |
0c75fe9804e2
Add coding: tag in Local Variables: section.
Kenichi Handa <handa@m17n.org>
parents:
31446
diff
changeset
|
1288 ;; End: |