comparison lisp/language/indian.el @ 107925:d95939738dba

Fix previous change of *-composable-pattern.
author Kenichi Handa <handa@etlken>
date Wed, 07 Apr 2010 15:09:33 +0900
parents 64dd8cad5b43
children 6a2e327273fe
comparison
equal deleted inserted replaced
107920:6ab7fa5331f8 107925:d95939738dba
239 (indian-compose-regexp 239 (indian-compose-regexp
240 (concat 240 (concat
241 ;; syllables with an independent vowel, or 241 ;; syllables with an independent vowel, or
242 "\\(?:RH\\)?Vn?\\(?:J?HR\\)?v*n?a?A?\\|" 242 "\\(?:RH\\)?Vn?\\(?:J?HR\\)?v*n?a?A?\\|"
243 ;; consonant-based syllables, or 243 ;; consonant-based syllables, or
244 "Cn?\\(?:J?HJ?Cn?\\)*\\(?:H[NJ]?|v*n?a?A?\\)\\|" 244 "Cn?\\(?:J?HJ?Cn?\\)*\\(?:H[NJ]?\\|v*n?a?A?\\)\\|"
245 ;; special consonant form, or 245 ;; special consonant form, or
246 "JHR\\|" 246 "JHR\\|"
247 ;; any other singleton characters 247 ;; any other singleton characters
248 "X") 248 "X")
249 table)) 249 table))
254 '(("a" . "\u0B01") ; SIGN CANDRABINDU 254 '(("a" . "\u0B01") ; SIGN CANDRABINDU
255 ("A" . "[\u0B02-\u0B03]") ; SIGN ANUSVARA .. VISARGA 255 ("A" . "[\u0B02-\u0B03]") ; SIGN ANUSVARA .. VISARGA
256 ("V" . "[\u0B05-\u0B14\u0B60-\u0B61]") ; independent vowel 256 ("V" . "[\u0B05-\u0B14\u0B60-\u0B61]") ; independent vowel
257 ("C" . "[\u0B15-\u0B39\u0B5C-\u0B5D\u0B71]") ; consonant 257 ("C" . "[\u0B15-\u0B39\u0B5C-\u0B5D\u0B71]") ; consonant
258 ("B" . "[\u0B15-\u0B17\u0B1B-\u0B1D\u0B1F-\u0B21\u0B23-\u0B24\u0B27-\u0B30\u0B32-\u0B35\u0B38-\u0B39]") ; consonant with below form 258 ("B" . "[\u0B15-\u0B17\u0B1B-\u0B1D\u0B1F-\u0B21\u0B23-\u0B24\u0B27-\u0B30\u0B32-\u0B35\u0B38-\u0B39]") ; consonant with below form
259 ("R" . "\u0B30") ; RA
259 ("n" . "\u0B3C") ; NUKTA 260 ("n" . "\u0B3C") ; NUKTA
260 ("v" . "[\u0B3E-\u0B44\u0B56-\u0B57\u0B62-\u0B63]") ; vowel sign 261 ("v" . "[\u0B3E-\u0B44\u0B47\u0B56-\u0B57\u0B62-\u0B63]") ; vowel sign
261 ("H" . "\u0B4D") ; VIRAMA 262 ("H" . "\u0B4D") ; VIRAMA
262 ("N" . "\u200C") ; ZWNJ 263 ("N" . "\u200C") ; ZWNJ
263 ("J" . "\u200D") ; ZWJ 264 ("J" . "\u200D") ; ZWJ
264 ("X" . "[\u0B00-\u0B7F]")))) ; all coverage 265 ("X" . "[\u0B00-\u0B7F]")))) ; all coverage
265 (indian-compose-regexp 266 (indian-compose-regexp
266 (concat 267 (concat
267 ;; syllables with an independent vowel, or 268 ;; syllables with an independent vowel, or
268 "\\(?:RH\\)?Vn?\\(?:J?HB\\)?v*n?a?A?\\|" 269 "\\(?:RH\\)?Vn?\\(?:J?HB\\)?v*n?a?A?\\|"
269 ;; consonant-based syllables, or 270 ;; consonant-based syllables, or
270 "Cn?\\(?:J?HJ?Cn?\\)*\\(?:H[NJ]?|v*n?a?A?\\)\\|" 271 "Cn?\\(?:J?HJ?Cn?\\)*\\(?:H[NJ]?\\|v*n?a?A?\\)\\|"
271 ;; special consonant form, or 272 ;; special consonant form, or
272 "JHB\\|" 273 "JHB\\|"
273 ;; any other singleton characters 274 ;; any other singleton characters
274 "X") 275 "X")
275 table)) 276 table))
286 ("J" . "\u200D") ; ZWJ 287 ("J" . "\u200D") ; ZWJ
287 ("X" . "[\u0B80-\u0BFF]")))) ; all coverage 288 ("X" . "[\u0B80-\u0BFF]")))) ; all coverage
288 (indian-compose-regexp 289 (indian-compose-regexp
289 (concat 290 (concat
290 ;; consonant-based syllables, or 291 ;; consonant-based syllables, or
291 "C\\(?:J?HJ?C\\)*\\(?:H[NJ]?|v*a?\\)\\|" 292 "C\\(?:J?HJ?C\\)*\\(?:H[NJ]?\\|v*a?\\)\\|"
292 ;; syllables with an independent vowel, or 293 ;; syllables with an independent vowel, or
293 "Vv*a?\\|" 294 "Vv*a?\\|"
294 ;; any other singleton characters 295 ;; any other singleton characters
295 "X") 296 "X")
296 table)) 297 table))
300 (let ((table 301 (let ((table
301 '(("a" . "[\u0C01-\u0C03]") ; SIGN CANDRABINDU .. VISARGA 302 '(("a" . "[\u0C01-\u0C03]") ; SIGN CANDRABINDU .. VISARGA
302 ("V" . "[\u0C05-\u0C14\u0C60-\u0C61]") ; independent vowel 303 ("V" . "[\u0C05-\u0C14\u0C60-\u0C61]") ; independent vowel
303 ("C" . "[\u0C15-\u0C39\u0C58-\u0C59]") ; consonant 304 ("C" . "[\u0C15-\u0C39\u0C58-\u0C59]") ; consonant
304 ("v" . "[\u0C3E-\u0C4C\u0C55-\u0C56\u0C62-\u0C63]") ; vowel sign 305 ("v" . "[\u0C3E-\u0C4C\u0C55-\u0C56\u0C62-\u0C63]") ; vowel sign
305 ("H" . "\u0BCD") ; VIRAMA 306 ("H" . "\u0C4D") ; VIRAMA
306 ("N" . "\u200C") ; ZWNJ 307 ("N" . "\u200C") ; ZWNJ
307 ("J" . "\u200D") ; ZWJ 308 ("J" . "\u200D") ; ZWJ
308 ("X" . "[\u0C00-\u0C7F]")))) ; all coverage 309 ("X" . "[\u0C00-\u0C7F]")))) ; all coverage
309 (indian-compose-regexp 310 (indian-compose-regexp
310 (concat 311 (concat
311 ;; consonant-based syllables, or 312 ;; consonant-based syllables, or
312 "C\\(?:J?HJ?C\\)*\\(?:H[NJ]?|v*a?\\)\\|" 313 "C\\(?:J?HJ?C\\)*\\(?:H[NJ]?\\|v*a?\\)\\|"
313 ;; syllables with an independent vowel, or 314 ;; syllables with an independent vowel, or
314 "V\\(?:J?HC\\)?v*a?\\|" 315 "V\\(?:J?HC\\)?v*a?\\|"
315 ;; special consonant form, or 316 ;; special consonant form, or
316 "JHC\\|" 317 "JHC\\|"
317 ;; any other singleton characters 318 ;; any other singleton characters
322 (defconst kannada-composable-pattern 323 (defconst kannada-composable-pattern
323 (let ((table 324 (let ((table
324 '(("A" . "[\u0C82-\u0C83]") ; SIGN ANUSVARA .. VISARGA 325 '(("A" . "[\u0C82-\u0C83]") ; SIGN ANUSVARA .. VISARGA
325 ("V" . "[\u0C85-\u0C94\u0CE0-\u0CE1]") ; independent vowel 326 ("V" . "[\u0C85-\u0C94\u0CE0-\u0CE1]") ; independent vowel
326 ("C" . "[\u0C95-\u0CB9\u0CDE]") ; consonant 327 ("C" . "[\u0C95-\u0CB9\u0CDE]") ; consonant
327 ("B" . "\u0CB0") ; RA 328 ("R" . "\u0CB0") ; RA
328 ("n" . "\u0CBC") ; NUKTA 329 ("n" . "\u0CBC") ; NUKTA
329 ("v" . "[\u0CBE-\u0CCC\u0CD5-\u0CD6\u0CE2-\u0CE3]") ; vowel sign 330 ("v" . "[\u0CBE-\u0CCC\u0CD5-\u0CD6\u0CE2-\u0CE3]") ; vowel sign
330 ("H" . "\u0CCD") ; VIRAMA 331 ("H" . "\u0CCD") ; VIRAMA
331 ("N" . "\u200C") ; ZWNJ 332 ("N" . "\u200C") ; ZWNJ
332 ("J" . "\u200D") ; ZWJ 333 ("J" . "\u200D") ; ZWJ
334 (indian-compose-regexp 335 (indian-compose-regexp
335 (concat 336 (concat
336 ;; syllables with an independent vowel, or 337 ;; syllables with an independent vowel, or
337 "\\(?:RH\\)?Vn?\\(?:J?HC\\)?v?A?\\|" 338 "\\(?:RH\\)?Vn?\\(?:J?HC\\)?v?A?\\|"
338 ;; consonant-based syllables, or 339 ;; consonant-based syllables, or
339 "Cn?\\(?:J?HJ?Cn?\\)*\\(?:H[NJ]?|v*n?A?\\)\\|" 340 "Cn?\\(?:J?HJ?Cn?\\)*\\(?:H[NJ]?\\|v*n?A?\\)\\|"
340 ;; special consonant form, or 341 ;; special consonant form, or
341 "JHB\\|" 342 "JHC\\|"
342 ;; any other singleton characters 343 ;; any other singleton characters
343 "X") 344 "X")
344 table)) 345 table))
345 "Regexp matching a composable sequence of Kannada characters.") 346 "Regexp matching a composable sequence of Kannada characters.")
346 347
349 '(("A" . "[\u0D02-\u0D03]") ; SIGN ANUSVARA .. VISARGA 350 '(("A" . "[\u0D02-\u0D03]") ; SIGN ANUSVARA .. VISARGA
350 ("V" . "[\u0D05-\u0D14\u0D60-\u0D61]") ; independent vowel 351 ("V" . "[\u0D05-\u0D14\u0D60-\u0D61]") ; independent vowel
351 ("C" . "[\u0D15-\u0D39]") ; consonant 352 ("C" . "[\u0D15-\u0D39]") ; consonant
352 ("Y" . "[\u0D2F-\u0D30\u0D32\u0D35]") ; YA, RA, LA, VA 353 ("Y" . "[\u0D2F-\u0D30\u0D32\u0D35]") ; YA, RA, LA, VA
353 ("v" . "[\u0D3E-\u0D48\u0D57\u0D62-\u0D63]") ; postbase matra 354 ("v" . "[\u0D3E-\u0D48\u0D57\u0D62-\u0D63]") ; postbase matra
355 ("H" . "\u0D4D") ; SIGN VIRAMA
354 ("N" . "\u200C") ; ZWNJ 356 ("N" . "\u200C") ; ZWNJ
355 ("J" . "\u200D") ; ZWJ 357 ("J" . "\u200D") ; ZWJ
356 ("X" . "[\u0D00-\u0D7F]")))) ; all coverage 358 ("X" . "[\u0D00-\u0D7F]")))) ; all coverage
357 (indian-compose-regexp 359 (indian-compose-regexp
358 (concat 360 (concat
359 ;; consonant-based syllables, or 361 ;; consonant-based syllables, or
360 "\\(?:CJ?HJ?C\\)*\\(?:H[NJ]?\\|v?A?\\)\\|" 362 "C\\(?:J?HJ?C\\)*\\(?:H[NJ]?\\|v?A?\\)\\|"
361 ;; syllables with an independent vowel, or 363 ;; syllables with an independent vowel, or
362 "V\\(?:J?HY\\)?v*?A?\\|" 364 "V\\(?:J?HY\\)?v*?A?\\|"
363 ;; special consonant form, or 365 ;; special consonant form, or
364 "JHY\\|" 366 "JHY\\|"
365 ;; any other singleton characters 367 ;; any other singleton characters