Mercurial > audlegacy
comparison src/audacious/strings.c @ 2313:3149d4b1a9a9 trunk
[svn] - objective-make autodepend fixes
- move all sourcecode into src/ and adjust Makefiles accordingly
author | nenolod |
---|---|
date | Fri, 12 Jan 2007 11:43:40 -0800 |
parents | |
children | 593fd166af00 |
comparison
equal
deleted
inserted
replaced
2312:e1a5a66fb9cc | 2313:3149d4b1a9a9 |
---|---|
1 /* Audacious | |
2 * Copyright (C) 2005-2007 Audacious development team. | |
3 * | |
4 * BMP - Cross-platform multimedia player | |
5 * Copyright (C) 2003-2004 BMP development team. | |
6 * | |
7 * Based on XMMS: | |
8 * Copyright (C) 1998-2003 XMMS development team. | |
9 * | |
10 * This program is free software; you can redistribute it and/or modify | |
11 * it under the terms of the GNU General Public License as published by | |
12 * the Free Software Foundation; under version 2 of the License. | |
13 * | |
14 * This program is distributed in the hope that it will be useful, | |
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
17 * GNU General Public License for more details. | |
18 * | |
19 * You should have received a copy of the GNU General Public License | |
20 * along with this program; if not, write to the Free Software | |
21 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA | |
22 * 02110-1301, USA. | |
23 */ | |
24 | |
25 #define WEIRD_UTF_16_PLAYLIST_ENCODING | |
26 | |
27 #ifdef HAVE_CONFIG_H | |
28 # include "config.h" | |
29 #endif | |
30 | |
31 #define NEED_GLADE | |
32 #include "util.h" | |
33 | |
34 #include <glib.h> | |
35 #include <glib/gi18n.h> | |
36 #include <glade/glade.h> | |
37 #include <gtk/gtk.h> | |
38 #include <stdio.h> | |
39 #include <stdlib.h> | |
40 #include <string.h> | |
41 #include <ctype.h> | |
42 | |
43 #include "platform/smartinclude.h" | |
44 #include <gdk/gdkkeysyms.h> | |
45 #include <X11/Xlib.h> | |
46 //#include <sys/ipc.h> | |
47 #include <unistd.h> | |
48 #include <errno.h> | |
49 | |
50 #ifdef HAVE_FTS_H | |
51 # include <fts.h> | |
52 #endif | |
53 | |
54 #include "glade.h" | |
55 #include "input.h" | |
56 #include "main.h" | |
57 #include "playback.h" | |
58 #include "playlist.h" | |
59 #include "ui_playlist.h" | |
60 | |
61 #ifdef USE_CHARDET | |
62 #include "../libguess/libguess.h" | |
63 #include "../librcd/librcd.h" | |
64 #ifdef HAVE_UDET | |
65 #include <libudet_c.h> | |
66 #endif | |
67 #endif | |
68 | |
69 static GQuark quark_popup_data; | |
70 | |
71 | |
72 /* | |
73 * escape_shell_chars() | |
74 * | |
75 * Escapes characters that are special to the shell inside double quotes. | |
76 */ | |
77 | |
78 gchar * | |
79 escape_shell_chars(const gchar * string) | |
80 { | |
81 const gchar *special = "$`\"\\"; /* Characters to escape */ | |
82 const gchar *in = string; | |
83 gchar *out, *escaped; | |
84 gint num = 0; | |
85 | |
86 while (*in != '\0') | |
87 if (strchr(special, *in++)) | |
88 num++; | |
89 | |
90 escaped = g_malloc(strlen(string) + num + 1); | |
91 | |
92 in = string; | |
93 out = escaped; | |
94 | |
95 while (*in != '\0') { | |
96 if (strchr(special, *in)) | |
97 *out++ = '\\'; | |
98 *out++ = *in++; | |
99 } | |
100 *out = '\0'; | |
101 | |
102 return escaped; | |
103 } | |
104 | |
105 static gchar * | |
106 str_twenty_to_space(gchar * str) | |
107 { | |
108 gchar *match, *match_end; | |
109 | |
110 g_return_val_if_fail(str != NULL, NULL); | |
111 | |
112 while ((match = strstr(str, "%20"))) { | |
113 match_end = match + 3; | |
114 *match++ = ' '; | |
115 while (*match_end) | |
116 *match++ = *match_end++; | |
117 *match = 0; | |
118 } | |
119 | |
120 return str; | |
121 } | |
122 | |
123 static gchar * | |
124 str_replace_char(gchar * str, gchar old, gchar new) | |
125 { | |
126 gchar *match; | |
127 | |
128 g_return_val_if_fail(str != NULL, NULL); | |
129 | |
130 match = str; | |
131 while ((match = strchr(match, old))) | |
132 *match = new; | |
133 | |
134 return str; | |
135 } | |
136 | |
137 gchar * | |
138 str_append(gchar * str, const gchar * add_str) | |
139 { | |
140 return str_replace(str, g_strconcat(str, add_str, NULL)); | |
141 } | |
142 | |
143 gchar * | |
144 str_replace(gchar * str, gchar * new_str) | |
145 { | |
146 g_free(str); | |
147 return new_str; | |
148 } | |
149 | |
150 void | |
151 str_replace_in(gchar ** str, gchar * new_str) | |
152 { | |
153 *str = str_replace(*str, new_str); | |
154 } | |
155 | |
156 | |
157 gboolean | |
158 str_has_prefix_nocase(const gchar * str, const gchar * prefix) | |
159 { | |
160 return (strncasecmp(str, prefix, strlen(prefix)) == 0); | |
161 } | |
162 | |
163 gboolean | |
164 str_has_suffix_nocase(const gchar * str, const gchar * suffix) | |
165 { | |
166 return (strcasecmp(str + strlen(str) - strlen(suffix), suffix) == 0); | |
167 } | |
168 | |
169 gboolean | |
170 str_has_suffixes_nocase(const gchar * str, gchar * const *suffixes) | |
171 { | |
172 gchar *const *suffix; | |
173 | |
174 g_return_val_if_fail(str != NULL, FALSE); | |
175 g_return_val_if_fail(suffixes != NULL, FALSE); | |
176 | |
177 for (suffix = suffixes; *suffix; suffix++) | |
178 if (str_has_suffix_nocase(str, *suffix)) | |
179 return TRUE; | |
180 | |
181 return FALSE; | |
182 } | |
183 | |
184 gchar * | |
185 str_to_utf8_fallback(const gchar * str) | |
186 { | |
187 gchar *out_str, *convert_str, *chr; | |
188 | |
189 /* NULL in NULL out */ | |
190 if (!str) | |
191 return NULL; | |
192 | |
193 convert_str = g_strdup(str); | |
194 for (chr = convert_str; *chr; chr++) { | |
195 if (*chr & 0x80) | |
196 *chr = '?'; | |
197 } | |
198 | |
199 out_str = g_strconcat(convert_str, _(" (invalid UTF-8)"), NULL); | |
200 g_free(convert_str); | |
201 | |
202 return out_str; | |
203 } | |
204 | |
205 gchar * | |
206 filename_to_utf8(const gchar * filename) | |
207 { | |
208 gchar *out_str; | |
209 | |
210 /* NULL in NULL out */ | |
211 if (!filename) | |
212 return NULL; | |
213 | |
214 if ((out_str = g_filename_to_utf8(filename, -1, NULL, NULL, NULL))) | |
215 return out_str; | |
216 | |
217 return str_to_utf8_fallback(filename); | |
218 } | |
219 | |
220 gchar * | |
221 str_to_utf8(const gchar * str) | |
222 { | |
223 gchar *out_str; | |
224 | |
225 /* NULL in NULL out */ | |
226 if (!str) | |
227 return NULL; | |
228 | |
229 /* Note: Currently, playlist calls this function repeatedly, even | |
230 * if the string is already converted into utf-8. | |
231 * chardet_to_utf8() would convert a valid utf-8 string into a | |
232 * different utf-8 string, if fallback encodings were supplied and | |
233 * the given string could be treated as a string in one of fallback | |
234 * encodings. To avoid this, the order of evaluation has been | |
235 * changed. (It might cause a drawback?) | |
236 */ | |
237 /* chardet encoding detector */ | |
238 if ((out_str = chardet_to_utf8(str, strlen(str), NULL, NULL, NULL))) | |
239 return out_str; | |
240 | |
241 /* already UTF-8? */ | |
242 if (g_utf8_validate(str, -1, NULL)) | |
243 return g_strdup(str); | |
244 | |
245 /* assume encoding associated with locale */ | |
246 if ((out_str = g_locale_to_utf8(str, -1, NULL, NULL, NULL))) | |
247 return out_str; | |
248 | |
249 /* all else fails, we mask off character codes >= 128, | |
250 replace with '?' */ | |
251 return str_to_utf8_fallback(str); | |
252 } | |
253 | |
254 | |
255 const gchar * | |
256 str_skip_chars(const gchar * str, const gchar * chars) | |
257 { | |
258 while (strchr(chars, *str)) | |
259 str++; | |
260 return str; | |
261 } | |
262 | |
263 gchar * | |
264 convert_title_text(gchar * title) | |
265 { | |
266 g_return_val_if_fail(title != NULL, NULL); | |
267 | |
268 if (cfg.convert_slash) | |
269 str_replace_char(title, '\\', '/'); | |
270 | |
271 if (cfg.convert_underscore) | |
272 str_replace_char(title, '_', ' '); | |
273 | |
274 if (cfg.convert_twenty) | |
275 str_twenty_to_space(title); | |
276 | |
277 return title; | |
278 } | |
279 | |
280 gchar *chardet_to_utf8(const gchar *str, gssize len, | |
281 gsize *arg_bytes_read, gsize *arg_bytes_write, GError **arg_error) | |
282 { | |
283 #ifdef USE_CHARDET | |
284 char *det = NULL, *encoding = NULL; | |
285 #endif | |
286 gchar *ret = NULL; | |
287 gsize *bytes_read, *bytes_write; | |
288 GError **error; | |
289 gsize my_bytes_read, my_bytes_write; | |
290 | |
291 bytes_read = arg_bytes_read ? arg_bytes_read : &my_bytes_read; | |
292 bytes_write = arg_bytes_write ? arg_bytes_write : &my_bytes_write; | |
293 error = arg_error ? arg_error : NULL; | |
294 | |
295 #ifdef USE_CHARDET | |
296 if(cfg.chardet_detector) | |
297 det = cfg.chardet_detector; | |
298 | |
299 if(det){ | |
300 if(!strncasecmp("japanese", det, sizeof("japanese"))) { | |
301 encoding = (char *)guess_jp(str, strlen(str)); | |
302 if (!encoding) | |
303 goto fallback; | |
304 } else if(!strncasecmp("taiwanese", det, sizeof("taiwanese"))) { | |
305 encoding = (char *)guess_tw(str, strlen(str)); | |
306 if (!encoding) | |
307 goto fallback; | |
308 } else if(!strncasecmp("chinese", det, sizeof("chinese"))) { | |
309 encoding = (char *)guess_cn(str, strlen(str)); | |
310 if (!encoding) | |
311 goto fallback; | |
312 } else if(!strncasecmp("korean", det, sizeof("korean"))) { | |
313 encoding = (char *)guess_kr(str, strlen(str)); | |
314 if (!encoding) | |
315 goto fallback; | |
316 } else if(!strncasecmp("russian", det, sizeof("russian"))) { | |
317 rcd_russian_charset res = rcdGetRussianCharset(str, strlen(str)); | |
318 switch(res) { | |
319 case RUSSIAN_CHARSET_WIN: | |
320 encoding = "CP1251"; | |
321 break; | |
322 case RUSSIAN_CHARSET_ALT: | |
323 encoding = "CP866"; | |
324 break; | |
325 case RUSSIAN_CHARSET_KOI: | |
326 encoding = "KOI8-R"; | |
327 break; | |
328 case RUSSIAN_CHARSET_UTF8: | |
329 encoding = "UTF-8"; | |
330 break; | |
331 } | |
332 if (!encoding) | |
333 goto fallback; | |
334 #ifdef HAVE_UDET | |
335 } else if (!strncasecmp("universal", det, sizeof("universal"))) { | |
336 encoding = (char *)detectCharset((char *)str, strlen(str)); | |
337 if (!encoding) | |
338 goto fallback; | |
339 #endif | |
340 } else /* none, invalid */ | |
341 goto fallback; | |
342 | |
343 ret = g_convert(str, len, "UTF-8", encoding, bytes_read, bytes_write, error); | |
344 } | |
345 | |
346 fallback: | |
347 #endif | |
348 if(!ret && cfg.chardet_fallback){ | |
349 gchar **encs=NULL, **enc=NULL; | |
350 encs = g_strsplit_set(cfg.chardet_fallback, " ,:;|/", 0); | |
351 | |
352 if(encs){ | |
353 enc = encs; | |
354 for(enc=encs; *enc ; enc++){ | |
355 ret = g_convert(str, len, "UTF-8", *enc, bytes_read, bytes_write, error); | |
356 if(len == *bytes_read){ | |
357 break; | |
358 } | |
359 } | |
360 g_strfreev(encs); | |
361 } | |
362 } | |
363 | |
364 #ifdef USE_CHARDET | |
365 /* many tag libraries return 2byte latin1 utf8 character as | |
366 converted 8bit iso-8859-1 character, if they are asked to return | |
367 latin1 string. | |
368 */ | |
369 if(!ret){ | |
370 ret = g_convert(str, len, "UTF-8", "ISO-8859-1", bytes_read, bytes_write, error); | |
371 } | |
372 #endif | |
373 | |
374 if(ret){ | |
375 if(g_utf8_validate(ret, -1, NULL)) | |
376 return ret; | |
377 else { | |
378 g_free(ret); | |
379 ret = NULL; | |
380 } | |
381 } | |
382 | |
383 return NULL; /* if I have no idea, return NULL. */ | |
384 } |