annotate src/character.c @ 88387:06da178fab0e

* regex.c: Include "character.h" instead of "charset.h". (BYTE8_TO_CHAR, CHAR_BYTE8_P) [not emacs]: New dummy macros. (regex_compile): Accept a range whose starting and ending character have different leading bytes. (analyse_first): Adjusted for the above change.
author Kenichi Handa <handa@m17n.org>
date Fri, 01 Mar 2002 01:46:12 +0000
parents 13b9026422e0
children 1a3aec316071
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
1 /* Basic character support.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
2 Copyright (C) 1995, 1997, 1998, 2001 Electrotechnical Laboratory, JAPAN.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
3 Licensed to the Free Software Foundation.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
4 Copyright (C) 2001 Free Software Foundation, Inc.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
5 Copyright (C) 2001, 2002
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
6 National Institute of Advanced Industrial Science and Technology (AIST)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
7 Registration Number H13PRO009
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
8
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
9 This file is part of GNU Emacs.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
10
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
11 GNU Emacs is free software; you can redistribute it and/or modify
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
12 it under the terms of the GNU General Public License as published by
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
13 the Free Software Foundation; either version 2, or (at your option)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
14 any later version.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
15
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
16 GNU Emacs is distributed in the hope that it will be useful,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
17 but WITHOUT ANY WARRANTY; without even the implied warranty of
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
18 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
19 GNU General Public License for more details.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
20
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
21 You should have received a copy of the GNU General Public License
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
22 along with GNU Emacs; see the file COPYING. If not, write to
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
23 the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
24 Boston, MA 02111-1307, USA. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
25
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
26 /* At first, see the document in `character.h' to understand the code
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
27 in this file. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
28
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
29 #ifdef emacs
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
30 #include <config.h>
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
31 #endif
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
32
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
33 #include <stdio.h>
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
34
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
35 #ifdef emacs
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
36
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
37 #include <sys/types.h>
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
38 #include "lisp.h"
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
39 #include "character.h"
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
40 #include "buffer.h"
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
41 #include "charset.h"
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
42 #include "composite.h"
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
43 #include "disptab.h"
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
44
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
45 #else /* not emacs */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
46
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
47 #include "mulelib.h"
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
48
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
49 #endif /* emacs */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
50
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
51 Lisp_Object Qcharacterp;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
52
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
53 /* Vector of all translation tables ever defined.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
54 ID of a translation table is used to index this vector. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
55 Lisp_Object Vtranslation_table_vector;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
56
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
57 /* A char-table for characters which may invoke auto-filling. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
58 Lisp_Object Vauto_fill_chars;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
59
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
60 Lisp_Object Qauto_fill_chars;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
61
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
62 Lisp_Object Vchar_unify_table;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
63
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
64 /* A char-table. An element is non-nil iff the corresponding
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
65 character has a printable glyph. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
66 Lisp_Object Vprintable_chars;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
67
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
68 /* A char-table. An element is a column-width of the corresponding
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
69 character. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
70 Lisp_Object Vchar_width_table;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
71
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
72 /* A char-table. An element is a symbol indicating the direction
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
73 property of corresponding character. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
74 Lisp_Object Vchar_direction_table;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
75
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
76 /* Variables used locally in the macro FETCH_MULTIBYTE_CHAR. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
77 unsigned char *_fetch_multibyte_char_p;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
78 int _fetch_multibyte_char_len;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
79
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
80
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
81
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
82 int
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
83 char_string_with_unification (c, p, advanced)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
84 int c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
85 unsigned char *p, **advanced;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
86 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
87 int bytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
88
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
89 MAYBE_UNIFY_CHAR (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
90
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
91 if (c <= MAX_3_BYTE_CHAR || c > MAX_5_BYTE_CHAR)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
92 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
93 bytes = CHAR_STRING (c, p);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
94 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
95 else if (c <= MAX_4_BYTE_CHAR)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
96 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
97 p[0] = (0xF0 | (c >> 18));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
98 p[1] = (0x80 | ((c >> 12) & 0x3F));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
99 p[2] = (0x80 | ((c >> 6) & 0x3F));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
100 p[3] = (0x80 | (c & 0x3F));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
101 bytes = 4;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
102 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
103 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
104 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
105 p[0] = 0xF8;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
106 p[1] = (0x80 | ((c >> 18) & 0x0F));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
107 p[2] = (0x80 | ((c >> 12) & 0x3F));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
108 p[3] = (0x80 | ((c >> 6) & 0x3F));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
109 p[4] = (0x80 | (c & 0x3F));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
110 bytes = 5;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
111 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
112 if (advanced)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
113 *advanced = p + bytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
114 return bytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
115 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
116
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
117
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
/* Decode the multibyte sequence starting at P into a character code,
   pass that code through MAYBE_UNIFY_CHAR, and return it.  A lead
   byte that is >= 0x80 and has both the 0x20 and 0x10 bits set is
   decoded here, as a 4-byte sequence when bit 0x08 is clear and as a
   5-byte sequence when it is set; any other lead byte is handed to
   STRING_CHAR_ADVANCE.  If LEN is non-NULL, *LEN receives the number
   of bytes consumed.  If ADVANCED is non-NULL, *ADVANCED receives the
   address following the sequence.  */

int
string_char_with_unification (p, advanced, len)
     unsigned char *p, **advanced;
     int *len;
{
  /* NOTE(review): UNIFIED is not referenced directly in this function;
     it is retained in case MAYBE_UNIFY_CHAR relies on it -- confirm
     against the macro definition before removing.  */
  int c, unified;
  unsigned char *start = p;
  unsigned char lead = *p;

  if (lead >= 0x80 && (lead & 0x30) == 0x30)
    {
      if (lead & 0x08)
        {
          /* 5-byte sequence: the lead byte carries no payload.  */
          c = ((((p)[1] & 0x3F) << 18)
               | (((p)[2] & 0x3F) << 12)
               | (((p)[3] & 0x3F) << 6)
               | ((p)[4] & 0x3F));
          p += 5;
        }
      else
        {
          /* 4-byte sequence: the low bits of the lead byte are the
             most significant bits of the code.  */
          c = ((((p)[0] & 0xF) << 18)
               | (((p)[1] & 0x3F) << 12)
               | (((p)[2] & 0x3F) << 6)
               | ((p)[3] & 0x3F));
          p += 4;
        }
    }
  else
    c = STRING_CHAR_ADVANCE (p);

  MAYBE_UNIFY_CHAR (c);

  if (advanced != NULL)
    *advanced = p;
  if (len != NULL)
    *len = p - start;
  return c;
}
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
155
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
156
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
157 /* Translate character C by translation table TABLE. If C is
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
158 negative, translate a character specified by CHARSET and CODE. If
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
159 no translation is found in TABLE, return the untranslated
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
160 character. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
161
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
162 int
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
163 translate_char (table, c)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
164 Lisp_Object table;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
165 int c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
166 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
167 Lisp_Object ch;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
168
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
169 if (! CHAR_TABLE_P (table))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
170 return c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
171 ch = CHAR_TABLE_REF (table, c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
172 if (! CHARACTERP (ch))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
173 return c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
174 return XINT (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
175 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
176
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
177 /* Convert the unibyte character C to the corresponding multibyte
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
178 character based on the current value of charset_primary. If C
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
179 can't be converted, return C. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
180
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
181 int
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
182 unibyte_char_to_multibyte (c)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
183 int c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
184 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
185 struct charset *charset = CHARSET_FROM_ID (charset_primary);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
186 int c1 = DECODE_CHAR (charset, c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
187
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
188 return ((c1 >= 0) ? c1 : c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
189 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
190
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
191
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
192 /* Convert the multibyte character C to unibyte 8-bit character based
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
193 on the current value of charset_primary. If dimension of
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
194 charset_primary is more than one, return (C & 0xFF).
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
195
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
196 The argument REV_TBL is now ignored. It will be removed in the
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
197 future. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
198
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
199 int
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
200 multibyte_char_to_unibyte (c, rev_tbl)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
201 int c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
202 Lisp_Object rev_tbl;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
203 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
204 struct charset *charset = CHARSET_FROM_ID (charset_primary);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
205 unsigned c1 = ENCODE_CHAR (charset, c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
206
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
207 return ((c1 != CHARSET_INVALID_CODE (charset)) ? c1 : c & 0xFF);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
208 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
209
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
210
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
211 DEFUN ("characterp", Fcharacterp, Scharacterp, 1, 2, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
212 doc: /* Return non-nil if OBJECT is a character. */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
213 (object, ignore)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
214 Lisp_Object object, ignore;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
215 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
216 return (CHARACTERP (object) ? Qt : Qnil);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
217 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
218
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
219 DEFUN ("max-char", Fmax_char, Smax_char, 0, 0, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
220 doc: /* Return the character of the maximum code. */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
221 ()
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
222 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
223 return make_number (MAX_CHAR);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
224 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
225
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
226 DEFUN ("unibyte-char-to-multibyte", Funibyte_char_to_multibyte,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
227 Sunibyte_char_to_multibyte, 1, 1, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
228 doc: /* Convert the unibyte character CH to multibyte character.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
229 The multibyte character is a result of decoding CH by
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
230 the current primary charset (value of `charset-primary'). */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
231 (ch)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
232 Lisp_Object ch;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
233 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
234 int c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
235 struct charset *charset;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
236
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
237 CHECK_CHARACTER (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
238 c = XFASTINT (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
239 if (c >= 0400)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
240 error ("Invalid unibyte character: %d", c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
241 charset = CHARSET_FROM_ID (charset_primary);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
242 c = DECODE_CHAR (charset, c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
243 if (c < 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
244 error ("Can't convert to multibyte character: %d", XINT (ch));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
245 return make_number (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
246 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
247
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
248 DEFUN ("multibyte-char-to-unibyte", Fmultibyte_char_to_unibyte,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
249 Smultibyte_char_to_unibyte, 1, 1, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
250 doc: /* Convert the multibyte character CH to unibyte character.\n\
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
251 The unibyte character is a result of encoding CH by
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
252 the current primary charset (value of `charset-primary'). */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
253 (ch)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
254 Lisp_Object ch;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
255 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
256 int c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
257 unsigned code;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
258 struct charset *charset;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
259
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
260 CHECK_CHARACTER (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
261 c = XFASTINT (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
262 charset = CHARSET_FROM_ID (charset_primary);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
263 code = ENCODE_CHAR (charset, c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
264 if (code < CHARSET_MIN_CODE (charset)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
265 || code > CHARSET_MAX_CODE (charset))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
266 error ("Can't convert to unibyte character: %d", XINT (ch));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
267 return make_number (code);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
268 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
269
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
270 DEFUN ("char-bytes", Fchar_bytes, Schar_bytes, 1, 1, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
271 doc: /* Return 1 regardless of the argument CHAR.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
272 This is now an obsolete function. We keep it just for backward compatibility. */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
273 (ch)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
274 Lisp_Object ch;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
275 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
276 CHECK_CHARACTER (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
277 return make_number (1);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
278 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
279
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
280 DEFUN ("char-width", Fchar_width, Schar_width, 1, 1, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
281 doc: /* Return width of CHAR when displayed in the current buffer.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
282 The width is measured by how many columns it occupies on the screen.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
283 Tab is taken to occupy `tab-width' columns. */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
284 (ch)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
285 Lisp_Object ch;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
286 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
287 Lisp_Object disp;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
288 int c, width;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
289 struct Lisp_Char_Table *dp = buffer_display_table ();
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
290
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
291 CHECK_CHARACTER (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
292 c = XINT (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
293
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
294 /* Get the way the display table would display it. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
295 disp = dp ? DISP_CHAR_VECTOR (dp, c) : Qnil;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
296
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
297 if (VECTORP (disp))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
298 width = ASIZE (disp);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
299 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
300 width = CHAR_WIDTH (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
301
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
302 return make_number (width);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
303 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
304
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
/* Return the number of screen columns that the LEN bytes of text at
   STR occupy when displayed in the current buffer.  This is
   c_string_width with no precision limit, so no character or byte
   counts are reported back.  */

int
strwidth (str, len)
     unsigned char *str;
     int len;
{
  int columns;

  /* A negative precision means "measure everything"; the two output
     pointers are never written in that mode, so NULL is acceptable.  */
  columns = c_string_width (str, len, -1, NULL, NULL);
  return columns;
}
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
316
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
317 /* Return width of string STR of length LEN when displayed in the
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
318 current buffer. The width is measured by how many columns it
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
319 occupies on the screen. If PRECISION > 0, return the width of
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
320 longest substring that doesn't exceed PRECISION, and set number of
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
321 characters and bytes of the substring in *NCHARS and *NBYTES
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
322 respectively. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
323
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
324 c_string_width (str, len, precision, nchars, nbytes)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
325 unsigned char *str;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
326 int precision, *nchars, *nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
327 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
328 int i = 0, i_byte = 0;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
329 int width = 0;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
330 struct Lisp_Char_Table *dp = buffer_display_table ();
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
331
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
332 while (i_byte < len)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
333 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
334 int bytes, thiswidth;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
335 Lisp_Object val;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
336 int c = STRING_CHAR_AND_LENGTH (str + i_byte, len - i_byte, bytes);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
337
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
338 if (dp)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
339 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
340 val = DISP_CHAR_VECTOR (dp, c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
341 if (VECTORP (val))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
342 thiswidth = XVECTOR (val)->size;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
343 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
344 thiswidth = CHAR_WIDTH (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
345 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
346 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
347 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
348 thiswidth = CHAR_WIDTH (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
349 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
350
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
351 if (precision > 0
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
352 && (width + thiswidth > precision))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
353 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
354 *nchars = i;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
355 *nbytes = i_byte;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
356 return width;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
357 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
358 i++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
359 i_byte += bytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
360 width += thiswidth;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
361 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
362
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
363 if (precision > 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
364 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
365 *nchars = i;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
366 *nbytes = i_byte;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
367 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
368
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
369 return width;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
370 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
371
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
372 /* Return width of Lisp string STRING when displayed in the current
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
373 buffer. The width is measured by how many columns it occupies on
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
374 the screen while paying attention to compositions. If PRECISION >
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
375 0, return the width of longest substring that doesn't exceed
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
376 PRECISION, and set number of characters and bytes of the substring
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
377 in *NCHARS and *NBYTES respectively. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
378
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
379 int
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
380 lisp_string_width (string, precision, nchars, nbytes)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
381 Lisp_Object string;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
382 int precision, *nchars, *nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
383 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
384 int len = XSTRING (string)->size;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
385 int len_byte = STRING_BYTES (XSTRING (string));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
386 unsigned char *str = XSTRING (string)->data;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
387 int i = 0, i_byte = 0;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
388 int width = 0;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
389 struct Lisp_Char_Table *dp = buffer_display_table ();
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
390
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
391 while (i < len)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
392 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
393 int chars, bytes, thiswidth;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
394 Lisp_Object val;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
395 int cmp_id;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
396 int ignore, end;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
397
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
398 if (find_composition (i, -1, &ignore, &end, &val, string)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
399 && ((cmp_id = get_composition_id (i, i_byte, end - i, val, string))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
400 >= 0))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
401 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
402 thiswidth = composition_table[cmp_id]->width;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
403 chars = end - i;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
404 bytes = string_char_to_byte (string, end) - i_byte;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
405 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
406 else if (dp)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
407 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
408 int c = STRING_CHAR_AND_LENGTH (str + i_byte, len - i_byte, bytes);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
409
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
410 chars = 1;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
411 val = DISP_CHAR_VECTOR (dp, c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
412 if (VECTORP (val))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
413 thiswidth = XVECTOR (val)->size;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
414 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
415 thiswidth = CHAR_WIDTH (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
416 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
417 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
418 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
419 int c = STRING_CHAR_AND_LENGTH (str + i_byte, len - i_byte, bytes);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
420
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
421 chars = 1;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
422 thiswidth = CHAR_WIDTH (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
423 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
424
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
425 if (precision > 0
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
426 && (width + thiswidth > precision))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
427 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
428 *nchars = i;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
429 *nbytes = i_byte;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
430 return width;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
431 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
432 i += chars;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
433 i_byte += bytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
434 width += thiswidth;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
435 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
436
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
437 if (precision > 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
438 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
439 *nchars = i;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
440 *nbytes = i_byte;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
441 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
442
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
443 return width;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
444 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
445
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
446 DEFUN ("string-width", Fstring_width, Sstring_width, 1, 1, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
447 doc: /* Return width of STRING when displayed in the current buffer.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
448 Width is measured by how many columns it occupies on the screen.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
449 When calculating width of a multibyte character in STRING,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
450 only the base leading-code is considered; the validity of
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
451 the following bytes is not checked. Tabs in STRING are always
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
452 taken to occupy `tab-width' columns. */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
453 (str)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
454 Lisp_Object str;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
455 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
456 Lisp_Object val;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
457
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
458 CHECK_STRING (str);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
459 XSETFASTINT (val, lisp_string_width (str, -1, NULL, NULL));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
460 return val;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
461 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
462
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
463 DEFUN ("char-direction", Fchar_direction, Schar_direction, 1, 1, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
464 doc: /* Return the direction of CHAR.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
465 The returned value is 0 for left-to-right and 1 for right-to-left. */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
466 (ch)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
467 Lisp_Object ch;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
468 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
469 int c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
470
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
471 CHECK_CHARACTER (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
472 c = XINT (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
473 return CHAR_TABLE_REF (Vchar_direction_table, c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
474 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
475
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
476 DEFUN ("chars-in-region", Fchars_in_region, Schars_in_region, 2, 2, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
477 doc: /* Return number of characters between BEG and END.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
478 This is now an obsolete function. We keep it just for backward compatibility. */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
479 (beg, end)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
480 Lisp_Object beg, end;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
481 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
482 int from, to;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
483
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
484 CHECK_NUMBER_COERCE_MARKER (beg);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
485 CHECK_NUMBER_COERCE_MARKER (end);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
486
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
487 from = min (XFASTINT (beg), XFASTINT (end));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
488 to = max (XFASTINT (beg), XFASTINT (end));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
489
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
490 return make_number (to - from);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
491 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
492
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
493 /* Return the number of characters in the NBYTES bytes at PTR.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
494 This works by looking at the contents and checking for multibyte
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
495 sequences while assuming that there's no invalid sequence.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
496 However, if the current buffer has enable-multibyte-characters =
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
497 nil, we treat each byte as a character. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
498
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
499 int
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
500 chars_in_text (ptr, nbytes)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
501 unsigned char *ptr;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
502 int nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
503 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
504 /* current_buffer is null at early stages of Emacs initialization. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
505 if (current_buffer == 0
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
506 || NILP (current_buffer->enable_multibyte_characters))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
507 return nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
508
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
509 return multibyte_chars_in_text (ptr, nbytes);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
510 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
511
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
/* Count the characters in the NBYTES bytes starting at PTR by
   stepping over one multibyte sequence at a time.  The text is
   expected to contain no invalid sequence; if MULTIBYTE_LENGTH
   reports a length of zero, Emacs aborts.  The value of
   enable-multibyte-characters is not consulted.  */

int
multibyte_chars_in_text (ptr, nbytes)
     unsigned char *ptr;
     int nbytes;
{
  unsigned char *limit = ptr + nbytes;
  int count;

  for (count = 0; ptr < limit; count++)
    {
      int seq_len = MULTIBYTE_LENGTH (ptr, limit);

      /* A zero length would mean no progress is possible.  */
      if (seq_len == 0)
	abort ();

      ptr += seq_len;
    }

  return count;
}
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
537
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
538 /* Parse unibyte text at STR of LEN bytes as a multibyte text, count
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
539 characters and bytes in it, and store them in *NCHARS and *NBYTES
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
540 respectively. On counting bytes, pay attention to that 8-bit
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
541 characters not constructing a valid multibyte sequence are
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
542 represented by 2-byte in a multibyte text. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
543
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
544 void
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
545 parse_str_as_multibyte (str, len, nchars, nbytes)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
546 unsigned char *str;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
547 int len, *nchars, *nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
548 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
549 unsigned char *endp = str + len;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
550 int n, chars = 0, bytes = 0;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
551
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
552 if (len >= MAX_MULTIBYTE_LENGTH)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
553 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
554 unsigned char *adjusted_endp = endp - MAX_MULTIBYTE_LENGTH;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
555 while (str < adjusted_endp)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
556 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
557 if ((n = MULTIBYTE_LENGTH_NO_CHECK (str)) > 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
558 str += n, bytes += n;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
559 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
560 str++, bytes += 2;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
561 chars++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
562 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
563 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
564 while (str < endp)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
565 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
566 if ((n = MULTIBYTE_LENGTH (str, endp)) > 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
567 str += n, bytes += n;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
568 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
569 str++, bytes += 2;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
570 chars++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
571 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
572
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
573 *nchars = chars;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
574 *nbytes = bytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
575 return;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
576 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
577
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
578 /* Arrange unibyte text at STR of NBYTES bytes as a multibyte text.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
579 It actually converts only such 8-bit characters that don't construct
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
580 a multibyte sequence to multibyte forms of Latin-1 characters. If
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
581 NCHARS is nonzero, set *NCHARS to the number of characters in the
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
582 text. It is assured that we can use LEN bytes at STR as a work
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
583 area and that is enough. Return the number of bytes of the
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
584 resulting text. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
585
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
586 int
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
587 str_as_multibyte (str, len, nbytes, nchars)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
588 unsigned char *str;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
589 int len, nbytes, *nchars;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
590 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
591 unsigned char *p = str, *endp = str + nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
592 unsigned char *to;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
593 int chars = 0;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
594 int n;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
595
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
596 if (nbytes >= MAX_MULTIBYTE_LENGTH)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
597 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
598 unsigned char *adjusted_endp = endp - MAX_MULTIBYTE_LENGTH;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
599 while (p < adjusted_endp
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
600 && (n = MULTIBYTE_LENGTH_NO_CHECK (p)) > 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
601 p += n, chars++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
602 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
603 while ((n = MULTIBYTE_LENGTH (p, endp)) > 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
604 p += n, chars++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
605 if (nchars)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
606 *nchars = chars;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
607 if (p == endp)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
608 return nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
609
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
610 to = p;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
611 nbytes = endp - p;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
612 endp = str + len;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
613 safe_bcopy ((char *) p, (char *) (endp - nbytes), nbytes);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
614 p = endp - nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
615
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
616 if (nbytes >= MAX_MULTIBYTE_LENGTH)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
617 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
618 unsigned char *adjusted_endp = endp - MAX_MULTIBYTE_LENGTH;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
619 while (p < adjusted_endp)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
620 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
621 if ((n = MULTIBYTE_LENGTH_NO_CHECK (p)) > 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
622 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
623 while (n--)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
624 *to++ = *p++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
625 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
626 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
627 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
628 int c = *p++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
629 c = BYTE8_TO_CHAR (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
630 to += CHAR_STRING (c, to);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
631 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
632 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
633 chars++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
634 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
635 while (p < endp)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
636 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
637 if ((n = MULTIBYTE_LENGTH (p, endp)) > 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
638 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
639 while (n--)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
640 *to++ = *p++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
641 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
642 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
643 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
644 int c = *p++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
645 c = BYTE8_TO_CHAR (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
646 to += CHAR_STRING (c, to);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
647 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
648 chars++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
649 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
650 if (nchars)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
651 *nchars = chars;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
652 return (to - str);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
653 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
654
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
/* Scan the LEN bytes of unibyte text at STR and return the number of
   bytes the text may occupy once `str_to_multibyte' has converted it
   to a multibyte string.  */

int
parse_str_to_multibyte (str, len)
     unsigned char *str;
     int len;
{
  int total = 0;
  int i;

  /* A byte below 0x80 is counted as one byte, any other byte as
     two.  */
  for (i = 0; i < len; i++)
    {
      if (str[i] < 0x80)
        total += 1;
      else
        total += 2;
    }
  return total;
}
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
671
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
672
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
/* Convert the unibyte text of BYTES bytes at STR to a multibyte text
   that contains the same single-byte characters: every byte of 0x80
   or above is replaced by the multibyte form of its BYTE8_TO_CHAR
   character.  The caller assures that LEN bytes at STR may be used as
   a work area and that this is enough.  Return the byte length of the
   converted text.  */

int
str_to_multibyte (str, len, bytes)
     unsigned char *str;
     int len, bytes;
{
  unsigned char *limit = str + bytes;
  unsigned char *src, *dst;
  int rest;

  /* A leading run of bytes below 0x80 needs no conversion.  */
  for (src = str; src < limit; src++)
    if (*src >= 0x80)
      break;
  if (src == limit)
    return bytes;

  /* Move the remaining REST bytes to the end of the work area, then
     convert them from there back to DST, which starts at the first
     byte that needs conversion.  */
  dst = src;
  rest = limit - src;
  limit = str + len;
  safe_bcopy ((char *) src, (char *) (limit - rest), rest);

  for (src = limit - rest; src < limit; )
    {
      int c = *src++;

      if (c >= 0x80)
        c = BYTE8_TO_CHAR (c);
      dst += CHAR_STRING (c, dst);
    }
  return (dst - str);
}
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
705
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
/* Arrange the multibyte text of BYTES bytes at STR as a unibyte text,
   in place.  Each character whose leading byte satisfies
   CHAR_BYTE8_HEAD_P is replaced by the single byte CHAR_TO_BYTE8
   gives for it; all other characters are copied unchanged.  Return
   the byte length of the resulting text.  */

int
str_as_unibyte (str, bytes)
     unsigned char *str;
     int bytes;
{
  unsigned char *src = str, *limit = str + bytes;
  unsigned char *dst;
  int ch, nbytes;

  /* The text up to the first byte8 character stays where it is.  */
  for (; src < limit; src += nbytes)
    {
      ch = *src;
      nbytes = BYTES_BY_CHAR_HEAD (ch);
      if (CHAR_BYTE8_HEAD_P (ch))
        break;
    }

  /* From here on the output is written at DST, at or behind the read
     position SRC.  */
  dst = src;
  while (src < limit)
    {
      ch = *src;
      nbytes = BYTES_BY_CHAR_HEAD (ch);
      if (! CHAR_BYTE8_HEAD_P (ch))
        {
          /* Ordinary character: copy all of its bytes.  */
          for (; nbytes != 0; nbytes--)
            *dst++ = *src++;
          continue;
        }
      /* Byte8 character: decode it and store the single raw byte.  */
      ch = STRING_CHAR_ADVANCE (src);
      *dst++ = CHAR_TO_BYTE8 (ch);
    }
  return (dst - str);
}
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
744
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
745 int
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
746 string_count_byte8 (string)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
747 Lisp_Object string;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
748 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
749 int multibyte = STRING_MULTIBYTE (string);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
750 int nchars = XSTRING (string)->size;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
751 int nbytes = STRING_BYTES (XSTRING (string));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
752 unsigned char *p = XSTRING (string)->data;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
753 unsigned char *pend = p + nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
754 int count = 0;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
755 int c, len;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
756
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
757 if (multibyte)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
758 while (p < pend)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
759 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
760 c = *p;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
761 len = BYTES_BY_CHAR_HEAD (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
762
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
763 if (CHAR_BYTE8_HEAD_P (c))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
764 count++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
765 p += len;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
766 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
767 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
768 while (p < pend)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
769 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
770 if (*p++ >= 0x80)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
771 count++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
772 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
773 return count;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
774 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
775
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
776
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
777 Lisp_Object
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
778 string_escape_byte8 (string)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
779 Lisp_Object string;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
780 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
781 int nchars = XSTRING (string)->size;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
782 int nbytes = STRING_BYTES (XSTRING (string));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
783 int multibyte = STRING_MULTIBYTE (string);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
784 int byte8_count;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
785 unsigned char *src, *src_end, *dst;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
786 Lisp_Object val;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
787 int c, len;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
788
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
789 if (multibyte && nchars == nbytes)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
790 return string;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
791
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
792 byte8_count = string_count_byte8 (string);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
793
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
794 if (byte8_count == 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
795 return string;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
796
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
797 if (multibyte)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
798 /* Convert 2-byte sequence of byte8 chars to 4-byte octal. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
799 val = make_uninit_multibyte_string (nchars + byte8_count * 2,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
800 nbytes + byte8_count * 2);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
801 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
802 /* Convert 1-byte sequence of byte8 chars to 4-byte octal. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
803 val = make_uninit_string (nbytes + byte8_count * 3);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
804
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
805 src = XSTRING (string)->data;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
806 src_end = src + nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
807 dst = XSTRING (val)->data;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
808 if (multibyte)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
809 while (src < src_end)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
810 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
811 c = *src;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
812 len = BYTES_BY_CHAR_HEAD (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
813
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
814 if (CHAR_BYTE8_HEAD_P (c))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
815 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
816 c = STRING_CHAR_ADVANCE (src);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
817 c = CHAR_TO_BYTE8 (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
818 sprintf (dst, "\\%03o", c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
819 dst += 4;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
820 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
821 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
822 while (len--) *dst++ = *src++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
823 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
824 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
825 while (src < src_end)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
826 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
827 c = *src++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
828 if (c >= 0x80)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
829 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
830 sprintf (dst, "\\%03o", c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
831 dst += 4;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
832 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
833 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
834 *dst++ = c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
835 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
836 return val;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
837 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
838
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
839
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
840 DEFUN ("string", Fstring, Sstring, 1, MANY, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
841 doc: /*
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
842 Concatenate all the argument characters and make the result a string. */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
843 (n, args)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
844 int n;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
845 Lisp_Object *args;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
846 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
847 int i;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
848 unsigned char *buf = (unsigned char *) alloca (MAX_MULTIBYTE_LENGTH * n);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
849 unsigned char *p = buf;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
850 int c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
851
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
852 for (i = 0; i < n; i++)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
853 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
854 CHECK_CHARACTER (args[i]);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
855 c = XINT (args[i]);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
856 p += CHAR_STRING (c, p);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
857 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
858
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
859 return make_string_from_bytes ((char *) buf, n, p - buf);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
860 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
861
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
/* This function currently does nothing: its body is empty.
   NOTE(review): presumably a placeholder for one-time initialization
   of this file -- confirm against the callers.  */
void
init_character_once ()
{
}
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
866
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
867 #ifdef emacs
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
868
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
/* Set up the symbols, primitives and Lisp variables of this file and
   give the variables their initial values.  */
void
syms_of_character ()
{
  /* Symbols referred to from C.  */
  DEFSYM (Qcharacterp, "characterp");
  DEFSYM (Qauto_fill_chars, "auto-fill-chars");

  /* Vchar_unify_table is registered with staticpro and starts out as
     nil.  */
  staticpro (&Vchar_unify_table);
  Vchar_unify_table = Qnil;

  /* Register the primitives.  */
  defsubr (&Smax_char);
  defsubr (&Scharacterp);
  defsubr (&Sunibyte_char_to_multibyte);
  defsubr (&Smultibyte_char_to_unibyte);
  defsubr (&Schar_bytes);
  defsubr (&Schar_width);
  defsubr (&Sstring_width);
  defsubr (&Schar_direction);
  defsubr (&Schars_in_region);
  defsubr (&Sstring);

  /* Lisp variables.  Each one is initialized right after it is
     declared.  */

  /* Initial value: a vector of 16 elements, all nil.  */
  DEFVAR_LISP ("translation-table-vector", &Vtranslation_table_vector,
               doc: /*
Vector of cons cell of a symbol and translation table ever defined.
An ID of a translation table is an index of this vector. */);
  Vtranslation_table_vector = Fmake_vector (make_number (16), Qnil);

  /* Initial value: a char-table in which only space and newline are
     set to t.  */
  DEFVAR_LISP ("auto-fill-chars", &Vauto_fill_chars,
               doc: /*
A char-table for characters which invoke auto-filling.
Such characters have value t in this table. */);
  Vauto_fill_chars = Fmake_char_table (Qauto_fill_chars, Qnil);
  CHAR_TABLE_SET (Vauto_fill_chars, make_number (' '), Qt);
  CHAR_TABLE_SET (Vauto_fill_chars, make_number ('\n'), Qt);

  /* Initial value: a char-table created with the initial value 1.  */
  DEFVAR_LISP ("char-width-table", &Vchar_width_table,
               doc: /*
A char-table for width (columns) of each character. */);
  Vchar_width_table = Fmake_char_table (Qnil, make_number (1));

  /* Initial value: a char-table created with the initial value 1.  */
  DEFVAR_LISP ("char-direction-table", &Vchar_direction_table,
               doc: /* A char-table for direction of each character. */);
  Vchar_direction_table = Fmake_char_table (Qnil, make_number (1));

  /* Initial value: a char-table created with the initial value t.  */
  DEFVAR_LISP ("printable-chars", &Vprintable_chars,
               doc: /* A char-table for each printable character. */);
  Vprintable_chars = Fmake_char_table (Qnil, Qt);
}
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
916
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
917 #endif /* emacs */