annotate src/character.c @ 90882:49d1cdd3b100

*** empty log message ***
author Jason Rumney <jasonr@gnu.org>
date Thu, 31 May 2007 14:53:18 +0000
parents fa02baec53ff
children ba60bd18bc0b
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
1 /* Basic character support.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
2 Copyright (C) 1995, 1997, 1998, 2001 Electrotechnical Laboratory, JAPAN.
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89181
diff changeset
3 Licensed to the Free Software Foundation.
90424
4c7d4b278599 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 90403
diff changeset
4 Copyright (C) 2001, 2005, 2006 Free Software Foundation, Inc.
4c7d4b278599 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 90403
diff changeset
5 Copyright (C) 2003, 2006
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
6 National Institute of Advanced Industrial Science and Technology (AIST)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
7 Registration Number H13PRO009
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
8
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
9 This file is part of GNU Emacs.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
10
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
11 GNU Emacs is free software; you can redistribute it and/or modify
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
12 it under the terms of the GNU General Public License as published by
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
13 the Free Software Foundation; either version 2, or (at your option)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
14 any later version.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
15
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
16 GNU Emacs is distributed in the hope that it will be useful,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
17 but WITHOUT ANY WARRANTY; without even the implied warranty of
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
18 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
19 GNU General Public License for more details.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
20
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
21 You should have received a copy of the GNU General Public License
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
22 along with GNU Emacs; see the file COPYING. If not, write to
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
23 the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
24 Boston, MA 02111-1307, USA. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
25
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
26 /* First, see the documentation in `character.h' to understand the code
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
27 in this file. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
28
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
29 #ifdef emacs
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
30 #include <config.h>
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
31 #endif
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
32
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
33 #include <stdio.h>
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
34
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
35 #ifdef emacs
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
36
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
37 #include <sys/types.h>
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
38 #include "lisp.h"
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
39 #include "character.h"
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
40 #include "buffer.h"
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
41 #include "charset.h"
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
42 #include "composite.h"
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
43 #include "disptab.h"
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
44
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
45 #else /* not emacs */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
46
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
47 #include "mulelib.h"
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
48
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
49 #endif /* emacs */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
50
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
51 Lisp_Object Qcharacterp;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
52
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
53 /* Vector of all translation tables ever defined.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
54 ID of a translation table is used to index this vector. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
55 Lisp_Object Vtranslation_table_vector;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
56
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
57 /* A char-table for characters which may invoke auto-filling. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
58 Lisp_Object Vauto_fill_chars;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
59
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
60 Lisp_Object Qauto_fill_chars;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
61
89888
cfd942ddfdab *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89757
diff changeset
62 /* Char-table of information about which character to unify to which
cfd942ddfdab *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89757
diff changeset
63 Unicode character. */
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
64 Lisp_Object Vchar_unify_table;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
65
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
66 /* A char-table. An element is non-nil iff the corresponding
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
67 character has a printable glyph. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
68 Lisp_Object Vprintable_chars;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
69
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
70 /* A char-table. An element is a column-width of the corresponding
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
71 character. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
72 Lisp_Object Vchar_width_table;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
73
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
74 /* A char-table. An element is a symbol indicating the direction
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
75 property of corresponding character. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
76 Lisp_Object Vchar_direction_table;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
77
89020
b0277093a5f2 (_fetch_multibyte_char_len): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88990
diff changeset
78 /* Variable used locally in the macro FETCH_MULTIBYTE_CHAR. */
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
79 unsigned char *_fetch_multibyte_char_p;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
80
88913
76074dea1258 (Vscript_alist): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88878
diff changeset
81 /* Char table of scripts. */
76074dea1258 (Vscript_alist): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88878
diff changeset
82 Lisp_Object Vchar_script_table;
76074dea1258 (Vscript_alist): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88878
diff changeset
83
90403
81f1bbab281f (Vscript_representative_chars): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90256
diff changeset
84 /* Alist of scripts vs representative characters. */
81f1bbab281f (Vscript_representative_chars): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90256
diff changeset
85 Lisp_Object Vscript_representative_chars;
81f1bbab281f (Vscript_representative_chars): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90256
diff changeset
86
88913
76074dea1258 (Vscript_alist): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88878
diff changeset
87 static Lisp_Object Qchar_script_table;
76074dea1258 (Vscript_alist): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88878
diff changeset
88
89054
8a6da305ac40 (unibyte_to_multibyte_table): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89029
diff changeset
89 /* Mapping table from unibyte chars to multibyte chars. */
8a6da305ac40 (unibyte_to_multibyte_table): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89029
diff changeset
90 int unibyte_to_multibyte_table[256];
88878
a0ae1a5876c7 (Vscript_alist): New variable.
Kenichi Handa <handa@m17n.org>
parents: 88853
diff changeset
91
90020
680f4ba0cdc9 (unibyte_has_multibyte_table): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89911
diff changeset
92 /* Nth element is 1 iff unibyte char N can be mapped to a multibyte
680f4ba0cdc9 (unibyte_has_multibyte_table): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89911
diff changeset
93 char. */
680f4ba0cdc9 (unibyte_has_multibyte_table): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89911
diff changeset
94 char unibyte_has_multibyte_table[256];
680f4ba0cdc9 (unibyte_has_multibyte_table): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89911
diff changeset
95
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
96
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
97
89888
cfd942ddfdab *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89757
diff changeset
98 /* Store multibyte form of character C at P. If C has modifier bits,
cfd942ddfdab *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89757
diff changeset
99 handle them appropriately. */
cfd942ddfdab *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89757
diff changeset
100
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
101 int
89181
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
102 char_string (c, p)
90797
b74794d7f11a (char_string): Type of arg C changed to unsigned.
Kenichi Handa <handa@m17n.org>
parents: 90761
diff changeset
103 unsigned c;
88427
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
104 unsigned char *p;
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
105 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
106 int bytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
107
89181
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
108 if (c & CHAR_MODIFIER_MASK)
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
109 {
89538
c719d9f420d1 (char_string): Use ASCII_CHAR_P instead of SINGLE_BYTE_CHAR_P.
Kenichi Handa <handa@m17n.org>
parents: 89511
diff changeset
110 /* As a non-ASCII character can't have modifier bits, we just
c719d9f420d1 (char_string): Use ASCII_CHAR_P instead of SINGLE_BYTE_CHAR_P.
Kenichi Handa <handa@m17n.org>
parents: 89511
diff changeset
111 ignore the bits. */
c719d9f420d1 (char_string): Use ASCII_CHAR_P instead of SINGLE_BYTE_CHAR_P.
Kenichi Handa <handa@m17n.org>
parents: 89511
diff changeset
112 if (ASCII_CHAR_P ((c & ~CHAR_MODIFIER_MASK)))
89181
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
113 {
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
114 /* For Meta, Shift, and Control modifiers, we need special care. */
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
115 if (c & CHAR_META)
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
116 {
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
117 /* Move the meta bit to the right place for a string. */
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
118 c = (c & ~CHAR_META) | 0x80;
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
119 }
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
120 if (c & CHAR_SHIFT)
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
121 {
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
122 /* Shift modifier is valid only with [A-Za-z]. */
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
123 if ((c & 0377) >= 'A' && (c & 0377) <= 'Z')
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
124 c &= ~CHAR_SHIFT;
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
125 else if ((c & 0377) >= 'a' && (c & 0377) <= 'z')
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
126 c = (c & ~CHAR_SHIFT) - ('a' - 'A');
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
127 }
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
128 if (c & CHAR_CTL)
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
129 {
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
130 /* Simulate the code in lread.c. */
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
131 /* Allow `\C- ' and `\C-?'. */
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
132 if (c == (CHAR_CTL | ' '))
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
133 c = 0;
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
134 else if (c == (CHAR_CTL | '?'))
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
135 c = 127;
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
136 /* ASCII control chars are made from letters (both cases),
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
137 as well as the non-letters within 0100...0137. */
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
138 else if ((c & 0137) >= 0101 && (c & 0137) <= 0132)
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
139 c &= (037 | (~0177 & ~CHAR_CTL));
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
140 else if ((c & 0177) >= 0100 && (c & 0177) <= 0137)
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
141 c &= (037 | (~0177 & ~CHAR_CTL));
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
142 }
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
143 }
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
144
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
145 /* If C still has any modifier bits, just ignore them. */
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
146 c &= ~CHAR_MODIFIER_MASK;
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
147 }
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
148
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
149 MAYBE_UNIFY_CHAR (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
150
89181
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
151 if (c <= MAX_3_BYTE_CHAR)
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
152 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
153 bytes = CHAR_STRING (c, p);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
154 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
155 else if (c <= MAX_4_BYTE_CHAR)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
156 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
157 p[0] = (0xF0 | (c >> 18));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
158 p[1] = (0x80 | ((c >> 12) & 0x3F));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
159 p[2] = (0x80 | ((c >> 6) & 0x3F));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
160 p[3] = (0x80 | (c & 0x3F));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
161 bytes = 4;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
162 }
89181
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
163 else if (c <= MAX_5_BYTE_CHAR)
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
164 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
165 p[0] = 0xF8;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
166 p[1] = (0x80 | ((c >> 18) & 0x0F));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
167 p[2] = (0x80 | ((c >> 12) & 0x3F));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
168 p[3] = (0x80 | ((c >> 6) & 0x3F));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
169 p[4] = (0x80 | (c & 0x3F));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
170 bytes = 5;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
171 }
90797
b74794d7f11a (char_string): Type of arg C changed to unsigned.
Kenichi Handa <handa@m17n.org>
parents: 90761
diff changeset
172 else if (c <= MAX_CHAR)
89181
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
173 {
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
174 c = CHAR_TO_BYTE8 (c);
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
175 bytes = BYTE8_STRING (c, p);
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
176 }
90797
b74794d7f11a (char_string): Type of arg C changed to unsigned.
Kenichi Handa <handa@m17n.org>
parents: 90761
diff changeset
177 else
b74794d7f11a (char_string): Type of arg C changed to unsigned.
Kenichi Handa <handa@m17n.org>
parents: 90761
diff changeset
178 error ("Invalid character: %d", c);
88427
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
179
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
180 return bytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
181 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
182
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
183
89888
cfd942ddfdab *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89757
diff changeset
184 /* Return a character whose multibyte form is at P. If LEN is not
cfd942ddfdab *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89757
diff changeset
185 NULL, it must be a pointer to integer. In that case, set *LEN to
cfd942ddfdab *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89757
diff changeset
186 the byte length of the multibyte form. If ADVANCED is not NULL, it
cfd942ddfdab *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89757
diff changeset
187 must be a pointer to unsigned char. In that case, set *ADVANCED to
cfd942ddfdab *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89757
diff changeset
188 the ending address (i.e. the starting address of the next
cfd942ddfdab *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89757
diff changeset
189 character) of the multibyte form. */
cfd942ddfdab *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89757
diff changeset
190
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
191 int
89181
be75d5934738 (char_string): Renamed from
Kenichi Handa <handa@m17n.org>
parents: 89054
diff changeset
192 string_char (p, advanced, len)
88878
a0ae1a5876c7 (Vscript_alist): New variable.
Kenichi Handa <handa@m17n.org>
parents: 88853
diff changeset
193 const unsigned char *p;
a0ae1a5876c7 (Vscript_alist): New variable.
Kenichi Handa <handa@m17n.org>
parents: 88853
diff changeset
194 const unsigned char **advanced;
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
195 int *len;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
196 {
88427
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
197 int c;
88878
a0ae1a5876c7 (Vscript_alist): New variable.
Kenichi Handa <handa@m17n.org>
parents: 88853
diff changeset
198 const unsigned char *saved_p = p;
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
199
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
200 if (*p < 0x80 || ! (*p & 0x20) || ! (*p & 0x10))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
201 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
202 c = STRING_CHAR_ADVANCE (p);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
203 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
204 else if (! (*p & 0x08))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
205 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
206 c = ((((p)[0] & 0xF) << 18)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
207 | (((p)[1] & 0x3F) << 12)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
208 | (((p)[2] & 0x3F) << 6)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
209 | ((p)[3] & 0x3F));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
210 p += 4;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
211 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
212 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
213 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
214 c = ((((p)[1] & 0x3F) << 18)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
215 | (((p)[2] & 0x3F) << 12)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
216 | (((p)[3] & 0x3F) << 6)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
217 | ((p)[4] & 0x3F));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
218 p += 5;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
219 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
220
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
221 MAYBE_UNIFY_CHAR (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
222
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
223 if (len)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
224 *len = p - saved_p;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
225 if (advanced)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
226 *advanced = p;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
227 return c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
228 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
229
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
230
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
231 /* Translate character C by translation table TABLE. If C is
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
232 negative, translate a character specified by CHARSET and CODE. If
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
233 no translation is found in TABLE, return the untranslated
89757
482c15940000 (translate_char): Accept list of translation tables.
Kenichi Handa <handa@m17n.org>
parents: 89538
diff changeset
234 character. If TABLE is a list, elements are char tables. In this
482c15940000 (translate_char): Accept list of translation tables.
Kenichi Handa <handa@m17n.org>
parents: 89538
diff changeset
235 case, translate C by all tables. */
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
236
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
237 int
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
238 translate_char (table, c)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
239 Lisp_Object table;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
240 int c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
241 {
89757
482c15940000 (translate_char): Accept list of translation tables.
Kenichi Handa <handa@m17n.org>
parents: 89538
diff changeset
242 if (CHAR_TABLE_P (table))
482c15940000 (translate_char): Accept list of translation tables.
Kenichi Handa <handa@m17n.org>
parents: 89538
diff changeset
243 {
482c15940000 (translate_char): Accept list of translation tables.
Kenichi Handa <handa@m17n.org>
parents: 89538
diff changeset
244 Lisp_Object ch;
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
245
89757
482c15940000 (translate_char): Accept list of translation tables.
Kenichi Handa <handa@m17n.org>
parents: 89538
diff changeset
246 ch = CHAR_TABLE_REF (table, c);
482c15940000 (translate_char): Accept list of translation tables.
Kenichi Handa <handa@m17n.org>
parents: 89538
diff changeset
247 if (CHARACTERP (ch))
482c15940000 (translate_char): Accept list of translation tables.
Kenichi Handa <handa@m17n.org>
parents: 89538
diff changeset
248 c = XINT (ch);
482c15940000 (translate_char): Accept list of translation tables.
Kenichi Handa <handa@m17n.org>
parents: 89538
diff changeset
249 }
482c15940000 (translate_char): Accept list of translation tables.
Kenichi Handa <handa@m17n.org>
parents: 89538
diff changeset
250 else
482c15940000 (translate_char): Accept list of translation tables.
Kenichi Handa <handa@m17n.org>
parents: 89538
diff changeset
251 {
482c15940000 (translate_char): Accept list of translation tables.
Kenichi Handa <handa@m17n.org>
parents: 89538
diff changeset
252 for (; CONSP (table); table = XCDR (table))
482c15940000 (translate_char): Accept list of translation tables.
Kenichi Handa <handa@m17n.org>
parents: 89538
diff changeset
253 c = translate_char (XCAR (table), c);
482c15940000 (translate_char): Accept list of translation tables.
Kenichi Handa <handa@m17n.org>
parents: 89538
diff changeset
254 }
482c15940000 (translate_char): Accept list of translation tables.
Kenichi Handa <handa@m17n.org>
parents: 89538
diff changeset
255 return c;
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
256 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
257
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
258 /* Convert the multibyte character C to unibyte 8-bit character based
88983
2d504d707ce6 (unibyte_char_to_multibyte): Refer to
Kenichi Handa <handa@m17n.org>
parents: 88947
diff changeset
259 on the current value of charset_unibyte. If dimension of
2d504d707ce6 (unibyte_char_to_multibyte): Refer to
Kenichi Handa <handa@m17n.org>
parents: 88947
diff changeset
260 charset_unibyte is more than one, return (C & 0xFF).
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
261
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
262 The argument REV_TBL is now ignored. It will be removed in the
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
263 future. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
264
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
265 int
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
266 multibyte_char_to_unibyte (c, rev_tbl)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
267 int c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
268 Lisp_Object rev_tbl;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
269 {
89054
8a6da305ac40 (unibyte_to_multibyte_table): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89029
diff changeset
270 struct charset *charset;
8a6da305ac40 (unibyte_to_multibyte_table): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89029
diff changeset
271 unsigned c1;
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
272
89054
8a6da305ac40 (unibyte_to_multibyte_table): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89029
diff changeset
273 if (CHAR_BYTE8_P (c))
8a6da305ac40 (unibyte_to_multibyte_table): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89029
diff changeset
274 return CHAR_TO_BYTE8 (c);
8a6da305ac40 (unibyte_to_multibyte_table): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89029
diff changeset
275 charset = CHARSET_FROM_ID (charset_unibyte);
8a6da305ac40 (unibyte_to_multibyte_table): New variable.
Kenichi Handa <handa@m17n.org>
parents: 89029
diff changeset
276 c1 = ENCODE_CHAR (charset, c);
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
277 return ((c1 != CHARSET_INVALID_CODE (charset)) ? c1 : c & 0xFF);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
278 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
279
90761
2951f3d44eba (multibyte_char_to_unibyte_safe): New function.
Kenichi Handa <handa@m17n.org>
parents: 90424
diff changeset
280 /* Like multibyte_char_to_unibyte, but return -1 if C is not supported
2951f3d44eba (multibyte_char_to_unibyte_safe): New function.
Kenichi Handa <handa@m17n.org>
parents: 90424
diff changeset
281 by charset_unibyte. */
2951f3d44eba (multibyte_char_to_unibyte_safe): New function.
Kenichi Handa <handa@m17n.org>
parents: 90424
diff changeset
282
2951f3d44eba (multibyte_char_to_unibyte_safe): New function.
Kenichi Handa <handa@m17n.org>
parents: 90424
diff changeset
283 int
2951f3d44eba (multibyte_char_to_unibyte_safe): New function.
Kenichi Handa <handa@m17n.org>
parents: 90424
diff changeset
284 multibyte_char_to_unibyte_safe (c)
2951f3d44eba (multibyte_char_to_unibyte_safe): New function.
Kenichi Handa <handa@m17n.org>
parents: 90424
diff changeset
285 int c;
2951f3d44eba (multibyte_char_to_unibyte_safe): New function.
Kenichi Handa <handa@m17n.org>
parents: 90424
diff changeset
286 {
2951f3d44eba (multibyte_char_to_unibyte_safe): New function.
Kenichi Handa <handa@m17n.org>
parents: 90424
diff changeset
287 struct charset *charset;
2951f3d44eba (multibyte_char_to_unibyte_safe): New function.
Kenichi Handa <handa@m17n.org>
parents: 90424
diff changeset
288 unsigned c1;
2951f3d44eba (multibyte_char_to_unibyte_safe): New function.
Kenichi Handa <handa@m17n.org>
parents: 90424
diff changeset
289
2951f3d44eba (multibyte_char_to_unibyte_safe): New function.
Kenichi Handa <handa@m17n.org>
parents: 90424
diff changeset
290 if (CHAR_BYTE8_P (c))
2951f3d44eba (multibyte_char_to_unibyte_safe): New function.
Kenichi Handa <handa@m17n.org>
parents: 90424
diff changeset
291 return CHAR_TO_BYTE8 (c);
2951f3d44eba (multibyte_char_to_unibyte_safe): New function.
Kenichi Handa <handa@m17n.org>
parents: 90424
diff changeset
292 charset = CHARSET_FROM_ID (charset_unibyte);
2951f3d44eba (multibyte_char_to_unibyte_safe): New function.
Kenichi Handa <handa@m17n.org>
parents: 90424
diff changeset
293 c1 = ENCODE_CHAR (charset, c);
2951f3d44eba (multibyte_char_to_unibyte_safe): New function.
Kenichi Handa <handa@m17n.org>
parents: 90424
diff changeset
294 return ((c1 != CHARSET_INVALID_CODE (charset)) ? c1 : -1);
2951f3d44eba (multibyte_char_to_unibyte_safe): New function.
Kenichi Handa <handa@m17n.org>
parents: 90424
diff changeset
295 }
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
296
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
297 DEFUN ("characterp", Fcharacterp, Scharacterp, 1, 2, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
298 doc: /* Return non-nil if OBJECT is a character. */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
299 (object, ignore)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
300 Lisp_Object object, ignore;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
301 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
302 return (CHARACTERP (object) ? Qt : Qnil);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
303 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
304
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
305 DEFUN ("max-char", Fmax_char, Smax_char, 0, 0, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
306 doc: /* Return the character of the maximum code. */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
307 ()
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
308 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
309 return make_number (MAX_CHAR);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
310 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
311
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
312 DEFUN ("unibyte-char-to-multibyte", Funibyte_char_to_multibyte,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
313 Sunibyte_char_to_multibyte, 1, 1, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
314 doc: /* Convert the unibyte character CH to multibyte character.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
315 The multibyte character is a result of decoding CH by
88990
16317690f974 (Funibyte_char_to_multibyte): Doc fix.
Dave Love <fx@gnu.org>
parents: 88983
diff changeset
316 the current unibyte charset (see `unibyte-charset'). */)
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
317 (ch)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
318 Lisp_Object ch;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
319 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
320 int c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
321 struct charset *charset;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
322
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
323 CHECK_CHARACTER (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
324 c = XFASTINT (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
325 if (c >= 0400)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
326 error ("Invalid unibyte character: %d", c);
88983
2d504d707ce6 (unibyte_char_to_multibyte): Refer to
Kenichi Handa <handa@m17n.org>
parents: 88947
diff changeset
327 charset = CHARSET_FROM_ID (charset_unibyte);
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
328 c = DECODE_CHAR (charset, c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
329 if (c < 0)
88947
894b8bce3208 (Funibyte_char_to_multibyte): If C can't be decoded
Kenichi Handa <handa@m17n.org>
parents: 88926
diff changeset
330 c = BYTE8_TO_CHAR (XFASTINT (ch));
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
331 return make_number (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
332 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
333
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
334 DEFUN ("multibyte-char-to-unibyte", Fmultibyte_char_to_unibyte,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
335 Smultibyte_char_to_unibyte, 1, 1, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
336 doc: /* Convert the multibyte character CH to unibyte character.\n\
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
337 The unibyte character is a result of encoding CH by
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
338 the current primary charset (value of `charset-primary'). */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
339 (ch)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
340 Lisp_Object ch;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
341 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
342 int c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
343
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
344 CHECK_CHARACTER (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
345 c = XFASTINT (ch);
88947
894b8bce3208 (Funibyte_char_to_multibyte): If C can't be decoded
Kenichi Handa <handa@m17n.org>
parents: 88926
diff changeset
346 c = CHAR_TO_BYTE8 (c);
894b8bce3208 (Funibyte_char_to_multibyte): If C can't be decoded
Kenichi Handa <handa@m17n.org>
parents: 88926
diff changeset
347 return make_number (c);
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
348 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
349
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
350 DEFUN ("char-bytes", Fchar_bytes, Schar_bytes, 1, 1, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
351 doc: /* Return 1 regardless of the argument CHAR.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
352 This is now an obsolete function. We keep it just for backward compatibility. */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
353 (ch)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
354 Lisp_Object ch;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
355 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
356 CHECK_CHARACTER (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
357 return make_number (1);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
358 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
359
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
360 DEFUN ("char-width", Fchar_width, Schar_width, 1, 1, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
361 doc: /* Return width of CHAR when displayed in the current buffer.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
362 The width is measured by how many columns it occupies on the screen.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
363 Tab is taken to occupy `tab-width' columns. */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
364 (ch)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
365 Lisp_Object ch;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
366 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
367 Lisp_Object disp;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
368 int c, width;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
369 struct Lisp_Char_Table *dp = buffer_display_table ();
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
370
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
371 CHECK_CHARACTER (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
372 c = XINT (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
373
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
374 /* Get the way the display table would display it. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
375 disp = dp ? DISP_CHAR_VECTOR (dp, c) : Qnil;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
376
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
377 if (VECTORP (disp))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
378 width = ASIZE (disp);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
379 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
380 width = CHAR_WIDTH (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
381
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
382 return make_number (width);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
383 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
384
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
385 /* Return width of string STR of length LEN when displayed in the
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
386 current buffer. The width is measured by how many columns it
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
387 occupies on the screen. If PRECISION > 0, return the width of
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
388 longest substring that doesn't exceed PRECISION, and set number of
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
389 characters and bytes of the substring in *NCHARS and *NBYTES
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
390 respectively. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
391
88427
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
392 int
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
393 c_string_width (str, len, precision, nchars, nbytes)
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89181
diff changeset
394 const unsigned char *str;
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
395 int precision, *nchars, *nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
396 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
397 int i = 0, i_byte = 0;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
398 int width = 0;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
399 struct Lisp_Char_Table *dp = buffer_display_table ();
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
400
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
401 while (i_byte < len)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
402 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
403 int bytes, thiswidth;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
404 Lisp_Object val;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
405 int c = STRING_CHAR_AND_LENGTH (str + i_byte, len - i_byte, bytes);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
406
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
407 if (dp)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
408 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
409 val = DISP_CHAR_VECTOR (dp, c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
410 if (VECTORP (val))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
411 thiswidth = XVECTOR (val)->size;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
412 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
413 thiswidth = CHAR_WIDTH (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
414 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
415 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
416 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
417 thiswidth = CHAR_WIDTH (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
418 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
419
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
420 if (precision > 0
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
421 && (width + thiswidth > precision))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
422 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
423 *nchars = i;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
424 *nbytes = i_byte;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
425 return width;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
426 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
427 i++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
428 i_byte += bytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
429 width += thiswidth;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
430 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
431
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
432 if (precision > 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
433 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
434 *nchars = i;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
435 *nbytes = i_byte;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
436 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
437
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
438 return width;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
439 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
440
88427
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
441 /* Return width of string STR of length LEN when displayed in the
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
442 current buffer. The width is measured by how many columns it
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
443 occupies on the screen. */
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
444
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
445 int
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
446 strwidth (str, len)
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
447 unsigned char *str;
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
448 int len;
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
449 {
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
450 return c_string_width (str, len, -1, NULL, NULL);
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
451 }
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
452
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
453 /* Return width of Lisp string STRING when displayed in the current
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
454 buffer. The width is measured by how many columns it occupies on
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
455 the screen while paying attention to compositions. If PRECISION >
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
456 0, return the width of longest substring that doesn't exceed
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
457 PRECISION, and set number of characters and bytes of the substring
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
458 in *NCHARS and *NBYTES respectively. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
459
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
460 int
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
461 lisp_string_width (string, precision, nchars, nbytes)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
462 Lisp_Object string;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
463 int precision, *nchars, *nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
464 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89181
diff changeset
465 int len = SCHARS (string);
90256
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
466 /* This set multibyte to 0 even if STRING is multibyte when it
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
467 contains only ascii and eight-bit-graphic, but that's
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
468 intentional. */
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
469 int multibyte = len < SBYTES (string);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89181
diff changeset
470 unsigned char *str = SDATA (string);
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
471 int i = 0, i_byte = 0;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
472 int width = 0;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
473 struct Lisp_Char_Table *dp = buffer_display_table ();
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
474
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
475 while (i < len)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
476 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
477 int chars, bytes, thiswidth;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
478 Lisp_Object val;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
479 int cmp_id;
89511
bae1254b8517 (lisp_string_width): Make ignore and end EMACS_INT.
Dave Love <fx@gnu.org>
parents: 89483
diff changeset
480 EMACS_INT ignore, end;
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
481
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
482 if (find_composition (i, -1, &ignore, &end, &val, string)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
483 && ((cmp_id = get_composition_id (i, i_byte, end - i, val, string))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
484 >= 0))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
485 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
486 thiswidth = composition_table[cmp_id]->width;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
487 chars = end - i;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
488 bytes = string_char_to_byte (string, end) - i_byte;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
489 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
490 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
491 {
90256
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
492 int c;
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
493
90256
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
494 if (multibyte)
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
495 c = STRING_CHAR_AND_LENGTH (str + i_byte, len - i_byte, bytes);
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
496 else
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
497 c = str[i_byte], bytes = 1;
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
498 chars = 1;
90256
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
499 if (dp)
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
500 {
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
501 val = DISP_CHAR_VECTOR (dp, c);
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
502 if (VECTORP (val))
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
503 thiswidth = XVECTOR (val)->size;
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
504 else
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
505 thiswidth = CHAR_WIDTH (c);
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
506 }
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
507 else
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
508 {
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
509 thiswidth = CHAR_WIDTH (c);
d4755c5aa57d (lisp_string_width): Check multibyteness of STRING.
Kenichi Handa <handa@m17n.org>
parents: 90159
diff changeset
510 }
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
511 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
512
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
513 if (precision > 0
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
514 && (width + thiswidth > precision))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
515 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
516 *nchars = i;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
517 *nbytes = i_byte;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
518 return width;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
519 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
520 i += chars;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
521 i_byte += bytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
522 width += thiswidth;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
523 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
524
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
525 if (precision > 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
526 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
527 *nchars = i;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
528 *nbytes = i_byte;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
529 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
530
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
531 return width;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
532 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
533
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
534 DEFUN ("string-width", Fstring_width, Sstring_width, 1, 1, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
535 doc: /* Return width of STRING when displayed in the current buffer.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
536 Width is measured by how many columns it occupies on the screen.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
537 When calculating width of a multibyte character in STRING,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
538 only the base leading-code is considered; the validity of
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
539 the following bytes is not checked. Tabs in STRING are always
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
540 taken to occupy `tab-width' columns. */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
541 (str)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
542 Lisp_Object str;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
543 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
544 Lisp_Object val;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
545
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
546 CHECK_STRING (str);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
547 XSETFASTINT (val, lisp_string_width (str, -1, NULL, NULL));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
548 return val;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
549 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
550
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
551 DEFUN ("char-direction", Fchar_direction, Schar_direction, 1, 1, 0,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
552 doc: /* Return the direction of CHAR.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
553 The returned value is 0 for left-to-right and 1 for right-to-left. */)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
554 (ch)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
555 Lisp_Object ch;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
556 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
557 int c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
558
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
559 CHECK_CHARACTER (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
560 c = XINT (ch);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
561 return CHAR_TABLE_REF (Vchar_direction_table, c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
562 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
563
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
564 /* Return the number of characters in the NBYTES bytes at PTR.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
565 This works by looking at the contents and checking for multibyte
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
566 sequences while assuming that there's no invalid sequence.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
567 However, if the current buffer has enable-multibyte-characters =
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
568 nil, we treat each byte as a character. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
569
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
570 int
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
571 chars_in_text (ptr, nbytes)
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89181
diff changeset
572 const unsigned char *ptr;
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
573 int nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
574 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
575 /* current_buffer is null at early stages of Emacs initialization. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
576 if (current_buffer == 0
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
577 || NILP (current_buffer->enable_multibyte_characters))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
578 return nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
579
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
580 return multibyte_chars_in_text (ptr, nbytes);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
581 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
582
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
/* Count the characters contained in the NBYTES bytes starting at PTR,
   always treating the bytes as multibyte text (the value of
   enable-multibyte-characters is ignored).  The text is walked one
   multibyte sequence at a time, assuming that there is no invalid
   sequence.  */

int
multibyte_chars_in_text (ptr, nbytes)
     const unsigned char *ptr;
     int nbytes;
{
  const unsigned char *limit = ptr + nbytes;
  int count;

  for (count = 0; ptr < limit; count++)
    {
      int step = MULTIBYTE_LENGTH (ptr, limit);

      /* A zero length contradicts the no-invalid-sequence assumption
         and would keep PTR from ever advancing, so give up.  */
      if (step == 0)
        abort ();
      ptr += step;
    }

  return count;
}
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
608
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
609 /* Parse unibyte text at STR of LEN bytes as a multibyte text, count
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
610 characters and bytes in it, and store them in *NCHARS and *NBYTES
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
611 respectively. On counting bytes, pay attention to that 8-bit
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
612 characters not constructing a valid multibyte sequence are
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
613 represented by 2-byte in a multibyte text. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
614
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
615 void
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
616 parse_str_as_multibyte (str, len, nchars, nbytes)
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89181
diff changeset
617 const unsigned char *str;
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
618 int len, *nchars, *nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
619 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89181
diff changeset
620 const unsigned char *endp = str + len;
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
621 int n, chars = 0, bytes = 0;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
622
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
623 if (len >= MAX_MULTIBYTE_LENGTH)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
624 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89181
diff changeset
625 const unsigned char *adjusted_endp = endp - MAX_MULTIBYTE_LENGTH;
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
626 while (str < adjusted_endp)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
627 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
628 if ((n = MULTIBYTE_LENGTH_NO_CHECK (str)) > 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
629 str += n, bytes += n;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
630 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
631 str++, bytes += 2;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
632 chars++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
633 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
634 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
635 while (str < endp)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
636 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
637 if ((n = MULTIBYTE_LENGTH (str, endp)) > 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
638 str += n, bytes += n;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
639 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
640 str++, bytes += 2;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
641 chars++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
642 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
643
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
644 *nchars = chars;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
645 *nbytes = bytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
646 return;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
647 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
648
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
649 /* Arrange unibyte text at STR of NBYTES bytes as a multibyte text.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
650 It actually converts only such 8-bit characters that don't contruct
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
651 a multibyte sequence to multibyte forms of Latin-1 characters. If
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
652 NCHARS is nonzero, set *NCHARS to the number of characters in the
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
653 text. It is assured that we can use LEN bytes at STR as a work
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
654 area and that is enough. Return the number of bytes of the
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
655 resulting text. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
656
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
657 int
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
658 str_as_multibyte (str, len, nbytes, nchars)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
659 unsigned char *str;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
660 int len, nbytes, *nchars;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
661 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
662 unsigned char *p = str, *endp = str + nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
663 unsigned char *to;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
664 int chars = 0;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
665 int n;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
666
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
667 if (nbytes >= MAX_MULTIBYTE_LENGTH)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
668 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
669 unsigned char *adjusted_endp = endp - MAX_MULTIBYTE_LENGTH;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
670 while (p < adjusted_endp
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
671 && (n = MULTIBYTE_LENGTH_NO_CHECK (p)) > 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
672 p += n, chars++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
673 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
674 while ((n = MULTIBYTE_LENGTH (p, endp)) > 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
675 p += n, chars++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
676 if (nchars)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
677 *nchars = chars;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
678 if (p == endp)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
679 return nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
680
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
681 to = p;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
682 nbytes = endp - p;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
683 endp = str + len;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
684 safe_bcopy ((char *) p, (char *) (endp - nbytes), nbytes);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
685 p = endp - nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
686
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
687 if (nbytes >= MAX_MULTIBYTE_LENGTH)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
688 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
689 unsigned char *adjusted_endp = endp - MAX_MULTIBYTE_LENGTH;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
690 while (p < adjusted_endp)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
691 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
692 if ((n = MULTIBYTE_LENGTH_NO_CHECK (p)) > 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
693 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
694 while (n--)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
695 *to++ = *p++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
696 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
697 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
698 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
699 int c = *p++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
700 c = BYTE8_TO_CHAR (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
701 to += CHAR_STRING (c, to);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
702 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
703 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
704 chars++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
705 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
706 while (p < endp)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
707 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
708 if ((n = MULTIBYTE_LENGTH (p, endp)) > 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
709 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
710 while (n--)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
711 *to++ = *p++;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89181
diff changeset
712 }
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
713 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
714 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
715 int c = *p++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
716 c = BYTE8_TO_CHAR (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
717 to += CHAR_STRING (c, to);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
718 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
719 chars++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
720 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
721 if (nchars)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
722 *nchars = chars;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
723 return (to - str);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
724 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
725
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
/* Scan the unibyte string at STR of LEN bytes and return the number
   of bytes it may occupy once converted to a multibyte string by
   `str_to_multibyte': 1 for every byte below 0x80 and 2 for every
   other byte.  */

int
parse_str_to_multibyte (str, len)
     unsigned char *str;
     int len;
{
  unsigned char *limit = str + len;
  int total = 0;

  while (str < limit)
    {
      if (*str >= 0x80)
        total += 2;
      else
        total += 1;
      str++;
    }
  return total;
}
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
742
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
743
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
/* Convert the unibyte text at STR of BYTES bytes, in place, to a
   multibyte text that contains the same single-byte characters:
   every byte >= 0x80 is replaced by the multibyte form of
   BYTE8_TO_CHAR (byte), and every other byte is kept.  It is assured
   that we can use LEN bytes at STR as a work area and that is enough.
   Return the number of bytes of the resulting text.  */

int
str_to_multibyte (str, len, bytes)
     unsigned char *str;
     int len, bytes;
{
  unsigned char *src = str, *limit = str + bytes;
  unsigned char *dst;
  int pending;

  /* The leading run of bytes below 0x80 stays as it is.  */
  for (; src < limit; src++)
    if (*src >= 0x80)
      break;
  if (src == limit)
    /* No byte needs conversion.  */
    return bytes;

  /* Move the remaining PENDING bytes to the end of the work area,
     then rewrite them starting at DST (where they used to begin),
     reading from their new location.  */
  dst = src;
  pending = limit - src;
  limit = str + len;
  safe_bcopy ((char *) src, (char *) (limit - pending), pending);
  src = limit - pending;

  while (src < limit)
    {
      int c = *src++;

      if (c >= 0x80)
        c = BYTE8_TO_CHAR (c);
      dst += CHAR_STRING (c, dst);
    }
  return (dst - str);
}
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
776
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
/* Arrange the multibyte text at STR of BYTES bytes, in place, as a
   unibyte text.  Only sequences whose leading byte satisfies
   CHAR_BYTE8_HEAD_P are converted, each to the single byte given by
   CHAR_TO_BYTE8; all other sequences are copied unchanged.  Return
   the number of bytes of the resulting text.  */

int
str_as_unibyte (str, bytes)
     unsigned char *str;
     int bytes;
{
  const unsigned char *src = str, *limit = str + bytes;
  unsigned char *dst;
  int c, seq_len;

  /* Nothing has to move until the first byte8 sequence is met, so
     just step over whole sequences up to that point.  */
  while (src < limit)
    {
      c = *src;
      if (CHAR_BYTE8_HEAD_P (c))
        break;
      src += BYTES_BY_CHAR_HEAD (c);
    }

  /* From here on, the output is written at DST while reading at SRC.  */
  dst = str + (src - str);
  while (src < limit)
    {
      c = *src;
      seq_len = BYTES_BY_CHAR_HEAD (c);
      if (! CHAR_BYTE8_HEAD_P (c))
        {
          /* Copy the whole sequence as it is.  */
          while (seq_len--)
            *dst++ = *src++;
        }
      else
        {
          /* Decode the character (this advances SRC) and store the
             single byte it stands for.  */
          c = STRING_CHAR_ADVANCE (src);
          *dst++ = CHAR_TO_BYTE8 (c);
        }
    }
  return (dst - str);
}
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
815
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
816 int
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
817 string_count_byte8 (string)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
818 Lisp_Object string;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
819 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
820 int multibyte = STRING_MULTIBYTE (string);
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89181
diff changeset
821 int nbytes = SBYTES (string);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89181
diff changeset
822 unsigned char *p = SDATA (string);
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
823 unsigned char *pend = p + nbytes;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
824 int count = 0;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
825 int c, len;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
826
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
827 if (multibyte)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
828 while (p < pend)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
829 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
830 c = *p;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
831 len = BYTES_BY_CHAR_HEAD (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
832
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
833 if (CHAR_BYTE8_HEAD_P (c))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
834 count++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
835 p += len;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
836 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
837 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
838 while (p < pend)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
839 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
840 if (*p++ >= 0x80)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
841 count++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
842 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
843 return count;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
844 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
845
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
846
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
847 Lisp_Object
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
848 string_escape_byte8 (string)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
849 Lisp_Object string;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
850 {
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89181
diff changeset
851 int nchars = SCHARS (string);
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89181
diff changeset
852 int nbytes = SBYTES (string);
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
853 int multibyte = STRING_MULTIBYTE (string);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
854 int byte8_count;
88878
a0ae1a5876c7 (Vscript_alist): New variable.
Kenichi Handa <handa@m17n.org>
parents: 88853
diff changeset
855 const unsigned char *src, *src_end;
a0ae1a5876c7 (Vscript_alist): New variable.
Kenichi Handa <handa@m17n.org>
parents: 88853
diff changeset
856 unsigned char *dst;
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
857 Lisp_Object val;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
858 int c, len;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
859
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
860 if (multibyte && nchars == nbytes)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
861 return string;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
862
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
863 byte8_count = string_count_byte8 (string);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
864
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
865 if (byte8_count == 0)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
866 return string;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
867
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
868 if (multibyte)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
869 /* Convert 2-byte sequence of byte8 chars to 4-byte octal. */
88526
6bac4ae1c326 (string_escape_byte8): Make multibyte string with correct size.
Kenichi Handa <handa@m17n.org>
parents: 88427
diff changeset
870 val = make_uninit_multibyte_string (nchars + byte8_count * 3,
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
871 nbytes + byte8_count * 2);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
872 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
873 /* Convert 1-byte sequence of byte8 chars to 4-byte octal. */
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
874 val = make_uninit_string (nbytes + byte8_count * 3);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
875
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89181
diff changeset
876 src = SDATA (string);
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
877 src_end = src + nbytes;
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89181
diff changeset
878 dst = SDATA (val);
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
879 if (multibyte)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
880 while (src < src_end)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
881 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
882 c = *src;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
883 len = BYTES_BY_CHAR_HEAD (c);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
884
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
885 if (CHAR_BYTE8_HEAD_P (c))
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
886 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
887 c = STRING_CHAR_ADVANCE (src);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
888 c = CHAR_TO_BYTE8 (c);
88427
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
889 sprintf ((char *) dst, "\\%03o", c);
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
890 dst += 4;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
891 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
892 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
893 while (len--) *dst++ = *src++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
894 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
895 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
896 while (src < src_end)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
897 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
898 c = *src++;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
899 if (c >= 0x80)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
900 {
88427
1a3aec316071 (c_string_width): Add return type `int'.
Kenichi Handa <handa@m17n.org>
parents: 88363
diff changeset
901 sprintf ((char *) dst, "\\%03o", c);
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
902 dst += 4;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
903 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
904 else
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
905 *dst++ = c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
906 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
907 return val;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
908 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
909
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
910
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 89181
diff changeset
911 DEFUN ("string", Fstring, Sstring, 0, MANY, 0,
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
912 doc: /*
88640
90a6e8c61273 (Fstring): Doc fix.
Dave Love <fx@gnu.org>
parents: 88526
diff changeset
913 Concatenate all the argument characters and make the result a string.
90a6e8c61273 (Fstring): Doc fix.
Dave Love <fx@gnu.org>
parents: 88526
diff changeset
914 usage: (string &rest CHARACTERS) */)
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
915 (n, args)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
916 int n;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
917 Lisp_Object *args;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
918 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
919 int i;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
920 unsigned char *buf = (unsigned char *) alloca (MAX_MULTIBYTE_LENGTH * n);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
921 unsigned char *p = buf;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
922 int c;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
923
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
924 for (i = 0; i < n; i++)
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
925 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
926 CHECK_CHARACTER (args[i]);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
927 c = XINT (args[i]);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
928 p += CHAR_STRING (c, p);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
929 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
930
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
931 return make_string_from_bytes ((char *) buf, n, p - buf);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
932 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
933
90841
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
934 DEFUN ("unibyte-string", Funibyte_string, Sunibyte_string, 0, MANY, 0,
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
935 doc: /* Concatenate all the argument bytes and make the result a unibyte string. */)
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
936 (n, args)
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
937 int n;
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
938 Lisp_Object *args;
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
939 {
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
940 int i;
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
941 unsigned char *buf = (unsigned char *) alloca (n);
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
942 unsigned char *p = buf;
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
943 unsigned c;
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
944
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
945 for (i = 0; i < n; i++)
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
946 {
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
947 CHECK_NATNUM (args[i]);
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
948 c = XFASTINT (args[i]);
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
949 if (c >= 256)
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
950 args_out_of_range_3 (args[i], make_number (0), make_number (255));
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
951 *p++ = c;
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
952 }
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
953
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
954 return make_string_from_bytes ((char *) buf, n, p - buf);
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
955 }
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
956
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
/* Initialization entry point for this file.  It currently performs
   no work.  */

void
init_character_once ()
{
  /* Intentionally empty.  */
}
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
961
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
962 #ifdef emacs
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
963
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
964 void
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
965 syms_of_character ()
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
966 {
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
967 DEFSYM (Qcharacterp, "characterp");
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
968 DEFSYM (Qauto_fill_chars, "auto-fill-chars");
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
969
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
970 staticpro (&Vchar_unify_table);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
971 Vchar_unify_table = Qnil;
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
972
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
973 defsubr (&Smax_char);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
974 defsubr (&Scharacterp);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
975 defsubr (&Sunibyte_char_to_multibyte);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
976 defsubr (&Smultibyte_char_to_unibyte);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
977 defsubr (&Schar_bytes);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
978 defsubr (&Schar_width);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
979 defsubr (&Sstring_width);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
980 defsubr (&Schar_direction);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
981 defsubr (&Sstring);
90841
fa02baec53ff (Funibyte_string): New function.
Kenichi Handa <handa@m17n.org>
parents: 90797
diff changeset
982 defsubr (&Sunibyte_string);
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
983
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
984 DEFVAR_LISP ("translation-table-vector", &Vtranslation_table_vector,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
985 doc: /*
88926
f026b7e4fc61 (syms_of_character) <translation-table-vector>: Doc
Dave Love <fx@gnu.org>
parents: 88913
diff changeset
986 Vector recording all translation tables ever defined.
f026b7e4fc61 (syms_of_character) <translation-table-vector>: Doc
Dave Love <fx@gnu.org>
parents: 88913
diff changeset
987 Each element is a pair (SYMBOL . TABLE) relating the table to the
f026b7e4fc61 (syms_of_character) <translation-table-vector>: Doc
Dave Love <fx@gnu.org>
parents: 88913
diff changeset
988 symbol naming it. The ID of a translation table is an index into this vector. */);
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
989 Vtranslation_table_vector = Fmake_vector (make_number (16), Qnil);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
990
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
991 DEFVAR_LISP ("auto-fill-chars", &Vauto_fill_chars,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
992 doc: /*
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
993 A char-table for characters which invoke auto-filling.
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
994 Such characters have value t in this table. */);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
995 Vauto_fill_chars = Fmake_char_table (Qauto_fill_chars, Qnil);
88853
503c60238368 (syms_of_character): Fix CHAR_TABLE_SET call.
Dave Love <fx@gnu.org>
parents: 88743
diff changeset
996 CHAR_TABLE_SET (Vauto_fill_chars, ' ', Qt);
503c60238368 (syms_of_character): Fix CHAR_TABLE_SET call.
Dave Love <fx@gnu.org>
parents: 88743
diff changeset
997 CHAR_TABLE_SET (Vauto_fill_chars, '\n', Qt);
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
998
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
999 DEFVAR_LISP ("char-width-table", &Vchar_width_table,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
1000 doc: /*
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
1001 A char-table for width (columns) of each character. */);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
1002 Vchar_width_table = Fmake_char_table (Qnil, make_number (1));
88743
4570f1a4c391 (syms_of_character): Setup Vchar_width_table for
Kenichi Handa <handa@m17n.org>
parents: 88716
diff changeset
1003 char_table_set_range (Vchar_width_table, 0x80, 0x9F, make_number (4));
4570f1a4c391 (syms_of_character): Setup Vchar_width_table for
Kenichi Handa <handa@m17n.org>
parents: 88716
diff changeset
1004 char_table_set_range (Vchar_width_table, MAX_5_BYTE_CHAR + 1, MAX_CHAR,
4570f1a4c391 (syms_of_character): Setup Vchar_width_table for
Kenichi Handa <handa@m17n.org>
parents: 88716
diff changeset
1005 make_number (4));
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
1006
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
1007 DEFVAR_LISP ("char-direction-table", &Vchar_direction_table,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
1008 doc: /* A char-table for direction of each character. */);
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
1009 Vchar_direction_table = Fmake_char_table (Qnil, make_number (1));
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
1010
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
1011 DEFVAR_LISP ("printable-chars", &Vprintable_chars,
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
1012 doc: /* A char-table for each printable character. */);
88716
f617b1bf301b (syms_of_character): Set the default value of
Kenichi Handa <handa@m17n.org>
parents: 88640
diff changeset
1013 Vprintable_chars = Fmake_char_table (Qnil, Qnil);
89029
ad8f56efa7c6 (syms_of_character): Setup Vprintable_chars.
Kenichi Handa <handa@m17n.org>
parents: 89020
diff changeset
1014 Fset_char_table_range (Vprintable_chars,
ad8f56efa7c6 (syms_of_character): Setup Vprintable_chars.
Kenichi Handa <handa@m17n.org>
parents: 89020
diff changeset
1015 Fcons (make_number (32), make_number (126)), Qt);
ad8f56efa7c6 (syms_of_character): Setup Vprintable_chars.
Kenichi Handa <handa@m17n.org>
parents: 89020
diff changeset
1016 Fset_char_table_range (Vprintable_chars,
ad8f56efa7c6 (syms_of_character): Setup Vprintable_chars.
Kenichi Handa <handa@m17n.org>
parents: 89020
diff changeset
1017 Fcons (make_number (160),
ad8f56efa7c6 (syms_of_character): Setup Vprintable_chars.
Kenichi Handa <handa@m17n.org>
parents: 89020
diff changeset
1018 make_number (MAX_5_BYTE_CHAR)), Qt);
88878
a0ae1a5876c7 (Vscript_alist): New variable.
Kenichi Handa <handa@m17n.org>
parents: 88853
diff changeset
1019
88913
76074dea1258 (Vscript_alist): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88878
diff changeset
1020 DEFVAR_LISP ("char-script-table", &Vchar_script_table,
76074dea1258 (Vscript_alist): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88878
diff changeset
1021 doc: /* Char table of script symbols.
76074dea1258 (Vscript_alist): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88878
diff changeset
1022 It has one extra slot whose value is a list of script symbols. */);
76074dea1258 (Vscript_alist): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88878
diff changeset
1023
76074dea1258 (Vscript_alist): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88878
diff changeset
1024 /* Intern this now in case it isn't already done.
76074dea1258 (Vscript_alist): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88878
diff changeset
1025 Setting this variable twice is harmless.
76074dea1258 (Vscript_alist): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88878
diff changeset
1026 But don't staticpro it here--that is done in alloc.c. */
76074dea1258 (Vscript_alist): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88878
diff changeset
1027 Qchar_table_extra_slots = intern ("char-table-extra-slots");
76074dea1258 (Vscript_alist): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88878
diff changeset
1028 DEFSYM (Qchar_script_table, "char-script-table");
76074dea1258 (Vscript_alist): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88878
diff changeset
1029 Fput (Qchar_script_table, Qchar_table_extra_slots, make_number (1));
76074dea1258 (Vscript_alist): This variable deleted.
Kenichi Handa <handa@m17n.org>
parents: 88878
diff changeset
1030 Vchar_script_table = Fmake_char_table (Qchar_script_table, Qnil);
90403
81f1bbab281f (Vscript_representative_chars): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90256
diff changeset
1031
81f1bbab281f (Vscript_representative_chars): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90256
diff changeset
1032 DEFVAR_LISP ("script-representative-chars", &Vscript_representative_chars,
81f1bbab281f (Vscript_representative_chars): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90256
diff changeset
1033 doc: /* Alist of scripts vs the representative characters. */);
81f1bbab281f (Vscript_representative_chars): New variable.
Kenichi Handa <handa@m17n.org>
parents: 90256
diff changeset
1034 Vscript_representative_chars = Qnil;
88363
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
1035 }
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
1036
13b9026422e0 New file.
Kenichi Handa <handa@m17n.org>
parents:
diff changeset
1037 #endif /* emacs */
89911
cce857c68ba2 Add arch taglines
Miles Bader <miles@gnu.org>
parents: 89888
diff changeset
1038
cce857c68ba2 Add arch taglines
Miles Bader <miles@gnu.org>
parents: 89888
diff changeset
1039 /* arch-tag: b6665960-3c3d-4184-85cd-af4318197999
cce857c68ba2 Add arch taglines
Miles Bader <miles@gnu.org>
parents: 89888
diff changeset
1040 (do not change this comment) */