comparison libpurple/util.c @ 15373:5fe8042783c1

Rename gtk/ and libgaim/ to pidgin/ and libpurple/
author Sean Egan <seanegan@gmail.com>
date Sat, 20 Jan 2007 02:32:10 +0000
parents
children 22bcaaefa478
comparison
equal deleted inserted replaced
15372:f79e0f4df793 15373:5fe8042783c1
1 /*
2 * @file util.h Utility Functions
3 * @ingroup core
4 *
5 * Gaim is the legal property of its developers, whose names are too numerous
6 * to list here. Please refer to the COPYRIGHT file distributed with this
7 * source distribution.
8 *
9 * This program is free software; you can redistribute it and/or modify
10 * it under the terms of the GNU General Public License as published by
11 * the Free Software Foundation; either version 2 of the License, or
12 * (at your option) any later version.
13 *
14 * This program is distributed in the hope that it will be useful,
15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
17 * GNU General Public License for more details.
18 *
19 * You should have received a copy of the GNU General Public License
20 * along with this program; if not, write to the Free Software
21 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
22 */
23 #include "internal.h"
24
25 #include "conversation.h"
26 #include "debug.h"
27 #include "notify.h"
28 #include "prpl.h"
29 #include "prefs.h"
30 #include "util.h"
31
32 struct _GaimUtilFetchUrlData
33 {
34 GaimUtilFetchUrlCallback callback;
35 void *user_data;
36
37 struct
38 {
39 char *user;
40 char *passwd;
41 char *address;
42 int port;
43 char *page;
44
45 } website;
46
47 char *url;
48 gboolean full;
49 char *user_agent;
50 gboolean http11;
51 char *request;
52 gsize request_written;
53 gboolean include_headers;
54
55 GaimProxyConnectData *connect_data;
56 int fd;
57 guint inpa;
58
59 gboolean got_headers;
60 gboolean has_explicit_data_len;
61 char *webdata;
62 unsigned long len;
63 unsigned long data_len;
64 };
65
66 static char custom_home_dir[MAXPATHLEN];
67 static char home_dir[MAXPATHLEN];
68
69 GaimMenuAction *
70 gaim_menu_action_new(const char *label, GaimCallback callback, gpointer data,
71 GList *children)
72 {
73 GaimMenuAction *act = g_new0(GaimMenuAction, 1);
74 act->label = g_strdup(label);
75 act->callback = callback;
76 act->data = data;
77 act->children = children;
78 return act;
79 }
80
81 void
82 gaim_menu_action_free(GaimMenuAction *act)
83 {
84 g_return_if_fail(act != NULL);
85
86 g_free(act->label);
87 g_free(act);
88 }
89
90 /**************************************************************************
91 * Base16 Functions
92 **************************************************************************/
93 gchar *
94 gaim_base16_encode(const guchar *data, gsize len)
95 {
96 int i;
97 gchar *ascii = NULL;
98
99 g_return_val_if_fail(data != NULL, NULL);
100 g_return_val_if_fail(len > 0, NULL);
101
102 ascii = g_malloc(len * 2 + 1);
103
104 for (i = 0; i < len; i++)
105 snprintf(&ascii[i * 2], 3, "%02hhx", data[i]);
106
107 return ascii;
108 }
109
110 guchar *
111 gaim_base16_decode(const char *str, gsize *ret_len)
112 {
113 int len, i, accumulator = 0;
114 guchar *data;
115
116 g_return_val_if_fail(str != NULL, NULL);
117
118 len = strlen(str);
119
120 g_return_val_if_fail(strlen(str) > 0, 0);
121 g_return_val_if_fail(len % 2 == 0, 0);
122
123 data = g_malloc(len / 2);
124
125 for (i = 0; i < len; i++)
126 {
127 if ((i % 2) == 0)
128 accumulator = 0;
129 else
130 accumulator <<= 4;
131
132 if (isdigit(str[i]))
133 accumulator |= str[i] - 48;
134 else
135 {
136 switch(str[i])
137 {
138 case 'a': case 'A': accumulator |= 10; break;
139 case 'b': case 'B': accumulator |= 11; break;
140 case 'c': case 'C': accumulator |= 12; break;
141 case 'd': case 'D': accumulator |= 13; break;
142 case 'e': case 'E': accumulator |= 14; break;
143 case 'f': case 'F': accumulator |= 15; break;
144 }
145 }
146
147 if (i % 2)
148 data[(i - 1) / 2] = accumulator;
149 }
150
151 if (ret_len != NULL)
152 *ret_len = len / 2;
153
154 return data;
155 }
156
157 /**************************************************************************
158 * Base64 Functions
159 **************************************************************************/
160 static const char alphabet[] =
161 "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz"
162 "0123456789+/";
163
164 static const char xdigits[] =
165 "0123456789abcdef";
166
167 gchar *
168 gaim_base64_encode(const guchar *data, gsize len)
169 {
170 char *out, *rv;
171
172 g_return_val_if_fail(data != NULL, NULL);
173 g_return_val_if_fail(len > 0, NULL);
174
175 rv = out = g_malloc(((len/3)+1)*4 + 1);
176
177 for (; len >= 3; len -= 3)
178 {
179 *out++ = alphabet[data[0] >> 2];
180 *out++ = alphabet[((data[0] << 4) & 0x30) | (data[1] >> 4)];
181 *out++ = alphabet[((data[1] << 2) & 0x3c) | (data[2] >> 6)];
182 *out++ = alphabet[data[2] & 0x3f];
183 data += 3;
184 }
185
186 if (len > 0)
187 {
188 unsigned char fragment;
189
190 *out++ = alphabet[data[0] >> 2];
191 fragment = (data[0] << 4) & 0x30;
192
193 if (len > 1)
194 fragment |= data[1] >> 4;
195
196 *out++ = alphabet[fragment];
197 *out++ = (len < 2) ? '=' : alphabet[(data[1] << 2) & 0x3c];
198 *out++ = '=';
199 }
200
201 *out = '\0';
202
203 return rv;
204 }
205
206 guchar *
207 gaim_base64_decode(const char *str, gsize *ret_len)
208 {
209 guchar *out = NULL;
210 char tmp = 0;
211 const char *c;
212 gint32 tmp2 = 0;
213 int len = 0, n = 0;
214
215 g_return_val_if_fail(str != NULL, NULL);
216
217 c = str;
218
219 while (*c) {
220 if (*c >= 'A' && *c <= 'Z') {
221 tmp = *c - 'A';
222 } else if (*c >= 'a' && *c <= 'z') {
223 tmp = 26 + (*c - 'a');
224 } else if (*c >= '0' && *c <= 57) {
225 tmp = 52 + (*c - '0');
226 } else if (*c == '+') {
227 tmp = 62;
228 } else if (*c == '/') {
229 tmp = 63;
230 } else if (*c == '\r' || *c == '\n') {
231 c++;
232 continue;
233 } else if (*c == '=') {
234 if (n == 3) {
235 out = g_realloc(out, len + 2);
236 out[len] = (guchar)(tmp2 >> 10) & 0xff;
237 len++;
238 out[len] = (guchar)(tmp2 >> 2) & 0xff;
239 len++;
240 } else if (n == 2) {
241 out = g_realloc(out, len + 1);
242 out[len] = (guchar)(tmp2 >> 4) & 0xff;
243 len++;
244 }
245 break;
246 }
247 tmp2 = ((tmp2 << 6) | (tmp & 0xff));
248 n++;
249 if (n == 4) {
250 out = g_realloc(out, len + 3);
251 out[len] = (guchar)((tmp2 >> 16) & 0xff);
252 len++;
253 out[len] = (guchar)((tmp2 >> 8) & 0xff);
254 len++;
255 out[len] = (guchar)(tmp2 & 0xff);
256 len++;
257 tmp2 = 0;
258 n = 0;
259 }
260 c++;
261 }
262
263 out = g_realloc(out, len + 1);
264 out[len] = 0;
265
266 if (ret_len != NULL)
267 *ret_len = len;
268
269 return out;
270 }
271
272 /**************************************************************************
273 * Quoted Printable Functions (see RFC 2045).
274 **************************************************************************/
275 guchar *
276 gaim_quotedp_decode(const char *str, gsize *ret_len)
277 {
278 char *n, *new;
279 const char *end, *p;
280
281 n = new = g_malloc(strlen (str) + 1);
282 end = str + strlen(str);
283
284 for (p = str; p < end; p++, n++) {
285 if (*p == '=') {
286 if (p[1] == '\r' && p[2] == '\n') { /* 5.1 #5 */
287 n -= 1;
288 p += 2;
289 } else if (p[1] == '\n') { /* fuzzy case for 5.1 #5 */
290 n -= 1;
291 p += 1;
292 } else if (p[1] && p[2]) {
293 char *nibble1 = strchr(xdigits, tolower(p[1]));
294 char *nibble2 = strchr(xdigits, tolower(p[2]));
295 if (nibble1 && nibble2) { /* 5.1 #1 */
296 *n = ((nibble1 - xdigits) << 4) | (nibble2 - xdigits);
297 p += 2;
298 } else { /* This should never happen */
299 *n = *p;
300 }
301 } else { /* This should never happen */
302 *n = *p;
303 }
304 }
305 else if (*p == '_')
306 *n = ' ';
307 else
308 *n = *p;
309 }
310
311 *n = '\0';
312
313 if (ret_len != NULL)
314 *ret_len = n - new;
315
316 /* Resize to take less space */
317 /* new = realloc(new, n - new); */
318
319 return (guchar *)new;
320 }
321
322 /**************************************************************************
323 * MIME Functions
324 **************************************************************************/
325 char *
326 gaim_mime_decode_field(const char *str)
327 {
328 /*
329 * This is wing's version, partially based on revo/shx's version
330 * See RFC2047 [which apparently obsoletes RFC1342]
331 */
332 typedef enum {
333 state_start, state_equal1, state_question1,
334 state_charset, state_question2,
335 state_encoding, state_question3,
336 state_encoded_text, state_question4, state_equal2 = state_start
337 } encoded_word_state_t;
338 encoded_word_state_t state = state_start;
339 const char *cur, *mark;
340 const char *charset0 = NULL, *encoding0 = NULL, *encoded_text0 = NULL;
341 char *n, *new;
342
343 /* token can be any CHAR (supposedly ISO8859-1/ISO2022), not just ASCII */
344 #define token_char_p(c) \
345 (c != ' ' && !iscntrl(c) && !strchr("()<>@,;:\"/[]?.=", c))
346
347 /* But encoded-text must be ASCII; alas, isascii() may not exist */
348 #define encoded_text_char_p(c) \
349 ((c & 0x80) == 0 && c != '?' && c != ' ' && isgraph(c))
350
351 #define RECOVER_MARKED_TEXT strncpy(n, mark, cur - mark + 1); \
352 n += cur - mark + 1
353
354 g_return_val_if_fail(str != NULL, NULL);
355
356 /* NOTE: Assuming that we need just strlen(str)+1 *may* be wrong.
357 * It would be wrong if one byte (in some unknown encoding) could
358 * expand to >=4 bytes of UTF-8; I don't know if there are such things.
359 */
360 n = new = g_malloc(strlen(str) + 1);
361
362 /* Here we will be looking for encoded words and if they seem to be
363 * valid then decode them.
364 * They are of this form: =?charset?encoding?text?=
365 */
366
367 for (cur = str, mark = NULL; *cur; cur += 1) {
368 switch (state) {
369 case state_equal1:
370 if (*cur == '?') {
371 state = state_question1;
372 } else {
373 RECOVER_MARKED_TEXT;
374 state = state_start;
375 }
376 break;
377 case state_question1:
378 if (token_char_p(*cur)) {
379 charset0 = cur;
380 state = state_charset;
381 } else { /* This should never happen */
382 RECOVER_MARKED_TEXT;
383 state = state_start;
384 }
385 break;
386 case state_charset:
387 if (*cur == '?') {
388 state = state_question2;
389 } else if (!token_char_p(*cur)) { /* This should never happen */
390 RECOVER_MARKED_TEXT;
391 state = state_start;
392 }
393 break;
394 case state_question2:
395 if (token_char_p(*cur)) {
396 encoding0 = cur;
397 state = state_encoding;
398 } else { /* This should never happen */
399 RECOVER_MARKED_TEXT;
400 state = state_start;
401 }
402 break;
403 case state_encoding:
404 if (*cur == '?') {
405 state = state_question3;
406 } else if (!token_char_p(*cur)) { /* This should never happen */
407 RECOVER_MARKED_TEXT;
408 state = state_start;
409 }
410 break;
411 case state_question3:
412 if (encoded_text_char_p(*cur)) {
413 encoded_text0 = cur;
414 state = state_encoded_text;
415 } else if (*cur == '?') { /* empty string */
416 encoded_text0 = cur;
417 state = state_question4;
418 } else { /* This should never happen */
419 RECOVER_MARKED_TEXT;
420 state = state_start;
421 }
422 break;
423 case state_encoded_text:
424 if (*cur == '?') {
425 state = state_question4;
426 } else if (!encoded_text_char_p(*cur)) {
427 RECOVER_MARKED_TEXT;
428 state = state_start;
429 }
430 break;
431 case state_question4:
432 if (*cur == '=') { /* Got the whole encoded-word */
433 char *charset = g_strndup(charset0, encoding0 - charset0 - 1);
434 char *encoding = g_strndup(encoding0, encoded_text0 - encoding0 - 1);
435 char *encoded_text = g_strndup(encoded_text0, cur - encoded_text0 - 1);
436 guchar *decoded = NULL;
437 gsize dec_len;
438 if (g_ascii_strcasecmp(encoding, "Q") == 0)
439 decoded = gaim_quotedp_decode(encoded_text, &dec_len);
440 else if (g_ascii_strcasecmp(encoding, "B") == 0)
441 decoded = gaim_base64_decode(encoded_text, &dec_len);
442 else
443 decoded = NULL;
444 if (decoded) {
445 gsize len;
446 char *converted = g_convert((const gchar *)decoded, dec_len, "utf-8", charset, NULL, &len, NULL);
447
448 if (converted) {
449 n = strncpy(n, converted, len) + len;
450 g_free(converted);
451 }
452 g_free(decoded);
453 }
454 g_free(charset);
455 g_free(encoding);
456 g_free(encoded_text);
457 state = state_equal2; /* Restart the FSM */
458 } else { /* This should never happen */
459 RECOVER_MARKED_TEXT;
460 state = state_start;
461 }
462 break;
463 default:
464 if (*cur == '=') {
465 mark = cur;
466 state = state_equal1;
467 } else {
468 /* Some unencoded text. */
469 *n = *cur;
470 n += 1;
471 }
472 break;
473 } /* switch */
474 } /* for */
475
476 if (state != state_start) {
477 RECOVER_MARKED_TEXT;
478 }
479 *n = '\0';
480
481 return new;
482 }
483
484
485 /**************************************************************************
486 * Date/Time Functions
487 **************************************************************************/
488
489 #ifdef _WIN32
490 static long win32_get_tz_offset() {
491 TIME_ZONE_INFORMATION tzi;
492 DWORD ret;
493 long off = -1;
494
495 if ((ret = GetTimeZoneInformation(&tzi)) != TIME_ZONE_ID_INVALID)
496 {
497 off = -(tzi.Bias * 60);
498 if (ret == TIME_ZONE_ID_DAYLIGHT)
499 off -= tzi.DaylightBias * 60;
500 }
501
502 return off;
503 }
504 #endif
505
506 #ifndef HAVE_STRFTIME_Z_FORMAT
507 static const char *get_tmoff(const struct tm *tm)
508 {
509 static char buf[6];
510 long off;
511 gint8 min;
512 gint8 hrs;
513 struct tm new_tm = *tm;
514
515 mktime(&new_tm);
516
517 if (new_tm.tm_isdst < 0)
518 g_return_val_if_reached("");
519
520 #ifdef _WIN32
521 if ((off = win32_get_tz_offset()) == -1)
522 return "";
523 #else
524 # ifdef HAVE_TM_GMTOFF
525 off = new_tm.tm_gmtoff;
526 # else
527 # ifdef HAVE_TIMEZONE
528 tzset();
529 off = -timezone;
530 # endif /* HAVE_TIMEZONE */
531 # endif /* !HAVE_TM_GMTOFF */
532 #endif /* _WIN32 */
533
534 min = (off / 60) % 60;
535 hrs = ((off / 60) - min) / 60;
536
537 if (g_snprintf(buf, sizeof(buf), "%+03d%02d", hrs, ABS(min)) > 5)
538 g_return_val_if_reached("");
539
540 return buf;
541 }
542 #endif
543
544 /* Windows doesn't HAVE_STRFTIME_Z_FORMAT, but this seems clearer. -- rlaager */
545 #if !defined(HAVE_STRFTIME_Z_FORMAT) || defined(_WIN32)
546 static size_t gaim_internal_strftime(char *s, size_t max, const char *format, const struct tm *tm)
547 {
548 const char *start;
549 const char *c;
550 char *fmt = NULL;
551
552 /* Yes, this is checked in gaim_utf8_strftime(),
553 * but better safe than sorry. -- rlaager */
554 g_return_val_if_fail(format != NULL, 0);
555
556 /* This is fairly efficient, and it only gets
557 * executed on Windows or if the underlying
558 * system doesn't support the %z format string,
559 * for strftime() so I think it's good enough.
560 * -- rlaager */
561 for (c = start = format; *c ; c++)
562 {
563 if (*c != '%')
564 continue;
565
566 c++;
567
568 #ifndef HAVE_STRFTIME_Z_FORMAT
569 if (*c == 'z')
570 {
571 char *tmp = g_strdup_printf("%s%.*s%s",
572 fmt ? fmt : "",
573 c - start - 1,
574 start,
575 get_tmoff(tm));
576 g_free(fmt);
577 fmt = tmp;
578 start = c + 1;
579 }
580 #endif
581 #ifdef _WIN32
582 if (*c == 'Z')
583 {
584 char *tmp = g_strdup_printf("%s%.*s%s",
585 fmt ? fmt : "",
586 c - start - 1,
587 start,
588 wgaim_get_timezone_abbreviation(tm));
589 g_free(fmt);
590 fmt = tmp;
591 start = c + 1;
592 }
593 #endif
594 }
595
596 if (fmt != NULL)
597 {
598 size_t ret;
599
600 if (*start)
601 {
602 char *tmp = g_strconcat(fmt, start, NULL);
603 g_free(fmt);
604 fmt = tmp;
605 }
606
607 ret = strftime(s, max, fmt, tm);
608 g_free(fmt);
609
610 return ret;
611 }
612
613 return strftime(s, max, format, tm);
614 }
615 #else /* HAVE_STRFTIME_Z_FORMAT && !_WIN32 */
616 #define gaim_internal_strftime strftime
617 #endif
618
619 const char *
620 gaim_utf8_strftime(const char *format, const struct tm *tm)
621 {
622 static char buf[128];
623 char *locale;
624 GError *err = NULL;
625 int len;
626 char *utf8;
627
628 g_return_val_if_fail(format != NULL, NULL);
629
630 if (tm == NULL)
631 {
632 time_t now = time(NULL);
633 tm = localtime(&now);
634 }
635
636 locale = g_locale_from_utf8(format, -1, NULL, NULL, &err);
637 if (err != NULL)
638 {
639 gaim_debug_error("util", "Format conversion failed in gaim_utf8_strftime(): %s", err->message);
640 g_error_free(err);
641 locale = g_strdup(format);
642 }
643
644 /* A return value of 0 is either an error (in
645 * which case, the contents of the buffer are
646 * undefined) or the empty string (in which
647 * case, no harm is done here). */
648 if ((len = gaim_internal_strftime(buf, sizeof(buf), locale, tm)) == 0)
649 {
650 g_free(locale);
651 return "";
652 }
653
654 g_free(locale);
655
656 utf8 = g_locale_to_utf8(buf, len, NULL, NULL, &err);
657 if (err != NULL)
658 {
659 gaim_debug_error("util", "Result conversion failed in gaim_utf8_strftime(): %s", err->message);
660 g_error_free(err);
661 }
662 else
663 {
664 gaim_strlcpy(buf, utf8);
665 g_free(utf8);
666 }
667
668 return buf;
669 }
670
671 const char *
672 gaim_date_format_short(const struct tm *tm)
673 {
674 return gaim_utf8_strftime("%x", tm);
675 }
676
677 const char *
678 gaim_date_format_long(const struct tm *tm)
679 {
680 return gaim_utf8_strftime(_("%x %X"), tm);
681 }
682
683 const char *
684 gaim_date_format_full(const struct tm *tm)
685 {
686 return gaim_utf8_strftime("%c", tm);
687 }
688
689 const char *
690 gaim_time_format(const struct tm *tm)
691 {
692 return gaim_utf8_strftime("%X", tm);
693 }
694
695 time_t
696 gaim_time_build(int year, int month, int day, int hour, int min, int sec)
697 {
698 struct tm tm;
699
700 tm.tm_year = year - 1900;
701 tm.tm_mon = month - 1;
702 tm.tm_mday = day;
703 tm.tm_hour = hour;
704 tm.tm_min = min;
705 tm.tm_sec = sec >= 0 ? sec : time(NULL) % 60;
706
707 return mktime(&tm);
708 }
709
710 time_t
711 gaim_str_to_time(const char *timestamp, gboolean utc,
712 struct tm *tm, long *tz_off, const char **rest)
713 {
714 time_t retval = 0;
715 struct tm *t;
716 const char *c = timestamp;
717 int year = 0;
718 long tzoff = GAIM_NO_TZ_OFF;
719
720 time(&retval);
721 t = localtime(&retval);
722
723 /* 4 digit year */
724 if (sscanf(c, "%04d", &year) && year > 1900)
725 {
726 c += 4;
727 if (*c == '-')
728 c++;
729 t->tm_year = year - 1900;
730 }
731
732 /* 2 digit month */
733 if (!sscanf(c, "%02d", &t->tm_mon))
734 {
735 if (rest != NULL && *c != '\0')
736 *rest = c;
737 return 0;
738 }
739 c += 2;
740 if (*c == '-' || *c == '/')
741 c++;
742 t->tm_mon -= 1;
743
744 /* 2 digit day */
745 if (!sscanf(c, "%02d", &t->tm_mday))
746 {
747 if (rest != NULL && *c != '\0')
748 *rest = c;
749 return 0;
750 }
751 c += 2;
752 if (*c == '/')
753 {
754 c++;
755
756 if (!sscanf(c, "%04d", &t->tm_year))
757 {
758 if (rest != NULL && *c != '\0')
759 *rest = c;
760 return 0;
761 }
762 t->tm_year -= 1900;
763 }
764 else if (*c == 'T' || *c == '.')
765 {
766 c++;
767 /* we have more than a date, keep going */
768
769 /* 2 digit hour */
770 if ((sscanf(c, "%02d:%02d:%02d", &t->tm_hour, &t->tm_min, &t->tm_sec) == 3 && (c = c + 8)) ||
771 (sscanf(c, "%02d%02d%02d", &t->tm_hour, &t->tm_min, &t->tm_sec) == 3 && (c = c + 6)))
772 {
773 gboolean offset_positive = FALSE;
774 int tzhrs;
775 int tzmins;
776
777 t->tm_isdst = -1;
778
779 if (*c == '.' && *(c+1) >= '0' && *(c+1) <= '9') /* dealing with precision we don't care about */
780 c += 4;
781 if (*c == '+')
782 offset_positive = TRUE;
783 if (((*c == '+' || *c == '-') && (c = c + 1)) &&
784 ((sscanf(c, "%02d:%02d", &tzhrs, &tzmins) == 2 && (c = c + 5)) ||
785 (sscanf(c, "%02d%02d", &tzhrs, &tzmins) == 2 && (c = c + 4))))
786 {
787 tzoff = tzhrs*60*60 + tzmins*60;
788 if (offset_positive)
789 tzoff *= -1;
790 /* We don't want the C library doing DST calculations
791 * if we know the UTC offset already. */
792 t->tm_isdst = 0;
793 }
794 else if (utc)
795 {
796 t->tm_isdst = 0;
797 }
798
799 if (rest != NULL && *c != '\0')
800 {
801 if (*c == ' ')
802 c++;
803 if (*c != '\0')
804 *rest = c;
805 }
806
807 if (tzoff != GAIM_NO_TZ_OFF || utc)
808 {
809 #if defined(_WIN32)
810 long sys_tzoff;
811 #endif
812
813 #if defined(_WIN32) || defined(HAVE_TM_GMTOFF) || defined (HAVE_TIMEZONE)
814 if (tzoff == GAIM_NO_TZ_OFF)
815 tzoff = 0;
816 #endif
817
818 #ifdef _WIN32
819 if ((sys_tzoff = win32_get_tz_offset()) == -1)
820 tzoff = GAIM_NO_TZ_OFF;
821 else
822 tzoff += sys_tzoff;
823 #else
824 #ifdef HAVE_TM_GMTOFF
825 tzoff += t->tm_gmtoff;
826 #else
827 # ifdef HAVE_TIMEZONE
828 tzset(); /* making sure */
829 tzoff -= timezone;
830 # endif
831 #endif
832 #endif /* _WIN32 */
833 }
834 }
835 else
836 {
837 if (rest != NULL && *c != '\0')
838 *rest = c;
839 }
840 }
841
842 if (tm != NULL)
843 {
844 *tm = *t;
845 tm->tm_isdst = -1;
846 mktime(tm);
847 }
848
849 retval = mktime(t);
850 if (tzoff != GAIM_NO_TZ_OFF)
851 retval += tzoff;
852
853 if (tz_off != NULL)
854 *tz_off = tzoff;
855
856 return retval;
857 }
858
859 /**************************************************************************
860 * Markup Functions
861 **************************************************************************/
862
863 /* Returns a NULL-terminated string after unescaping an entity
864 * (eg. &amp;, &lt; &#38 etc.) starting at s. Returns NULL on failure.*/
865 static const char *
866 detect_entity(const char *text, int *length)
867 {
868 const char *pln;
869 int len, pound;
870
871 if (!text || *text != '&')
872 return NULL;
873
874 #define IS_ENTITY(s) (!g_ascii_strncasecmp(text, s, (len = sizeof(s) - 1)))
875
876 if(IS_ENTITY("&amp;"))
877 pln = "&";
878 else if(IS_ENTITY("&lt;"))
879 pln = "<";
880 else if(IS_ENTITY("&gt;"))
881 pln = ">";
882 else if(IS_ENTITY("&nbsp;"))
883 pln = " ";
884 else if(IS_ENTITY("&copy;"))
885 pln = "\302\251"; /* or use g_unichar_to_utf8(0xa9); */
886 else if(IS_ENTITY("&quot;"))
887 pln = "\"";
888 else if(IS_ENTITY("&reg;"))
889 pln = "\302\256"; /* or use g_unichar_to_utf8(0xae); */
890 else if(IS_ENTITY("&apos;"))
891 pln = "\'";
892 else if(*(text+1) == '#' && (sscanf(text, "&#%u;", &pound) == 1) &&
893 pound != 0 && *(text+3+(gint)log10(pound)) == ';') {
894 static char buf[7];
895 int buflen = g_unichar_to_utf8((gunichar)pound, buf);
896 buf[buflen] = '\0';
897 pln = buf;
898
899 len = 2;
900 while(isdigit((gint) text[len])) len++;
901 if(text[len] == ';') len++;
902 }
903 else
904 return NULL;
905
906 if (length)
907 *length = len;
908 return pln;
909 }
910
911 gboolean
912 gaim_markup_find_tag(const char *needle, const char *haystack,
913 const char **start, const char **end, GData **attributes)
914 {
915 GData *attribs;
916 const char *cur = haystack;
917 char *name = NULL;
918 gboolean found = FALSE;
919 gboolean in_tag = FALSE;
920 gboolean in_attr = FALSE;
921 const char *in_quotes = NULL;
922 size_t needlelen;
923
924 g_return_val_if_fail( needle != NULL, FALSE);
925 g_return_val_if_fail( *needle != '\0', FALSE);
926 g_return_val_if_fail( haystack != NULL, FALSE);
927 g_return_val_if_fail( *haystack != '\0', FALSE);
928 g_return_val_if_fail( start != NULL, FALSE);
929 g_return_val_if_fail( end != NULL, FALSE);
930 g_return_val_if_fail(attributes != NULL, FALSE);
931
932 needlelen = strlen(needle);
933 g_datalist_init(&attribs);
934
935 while (*cur && !found) {
936 if (in_tag) {
937 if (in_quotes) {
938 const char *close = cur;
939
940 while (*close && *close != *in_quotes)
941 close++;
942
943 /* if we got the close quote, store the value and carry on from *
944 * after it. if we ran to the end of the string, point to the NULL *
945 * and we're outta here */
946 if (*close) {
947 /* only store a value if we have an attribute name */
948 if (name) {
949 size_t len = close - cur;
950 char *val = g_strndup(cur, len);
951
952 g_datalist_set_data_full(&attribs, name, val, g_free);
953 g_free(name);
954 name = NULL;
955 }
956
957 in_quotes = NULL;
958 cur = close + 1;
959 } else {
960 cur = close;
961 }
962 } else if (in_attr) {
963 const char *close = cur;
964
965 while (*close && *close != '>' && *close != '"' &&
966 *close != '\'' && *close != ' ' && *close != '=')
967 close++;
968
969 /* if we got the equals, store the name of the attribute. if we got
970 * the quote, save the attribute and go straight to quote mode.
971 * otherwise the tag closed or we reached the end of the string,
972 * so we can get outta here */
973 switch (*close) {
974 case '"':
975 case '\'':
976 in_quotes = close;
977 case '=':
978 {
979 size_t len = close - cur;
980
981 /* don't store a blank attribute name */
982 if (len) {
983 g_free(name);
984 name = g_ascii_strdown(cur, len);
985 }
986
987 in_attr = FALSE;
988 cur = close + 1;
989 break;
990 }
991 case ' ':
992 case '>':
993 in_attr = FALSE;
994 default:
995 cur = close;
996 break;
997 }
998 } else {
999 switch (*cur) {
1000 case ' ':
1001 /* swallow extra spaces inside tag */
1002 while (*cur && *cur == ' ') cur++;
1003 in_attr = TRUE;
1004 break;
1005 case '>':
1006 found = TRUE;
1007 *end = cur;
1008 break;
1009 case '"':
1010 case '\'':
1011 in_quotes = cur;
1012 default:
1013 cur++;
1014 break;
1015 }
1016 }
1017 } else {
1018 /* if we hit a < followed by the name of our tag... */
1019 if (*cur == '<' && !g_ascii_strncasecmp(cur + 1, needle, needlelen)) {
1020 *start = cur;
1021 cur = cur + needlelen + 1;
1022
1023 /* if we're pointing at a space or a >, we found the right tag. if *
1024 * we're not, we've found a longer tag, so we need to skip to the *
1025 * >, but not being distracted by >s inside quotes. */
1026 if (*cur == ' ' || *cur == '>') {
1027 in_tag = TRUE;
1028 } else {
1029 while (*cur && *cur != '"' && *cur != '\'' && *cur != '>') {
1030 if (*cur == '"') {
1031 cur++;
1032 while (*cur && *cur != '"')
1033 cur++;
1034 } else if (*cur == '\'') {
1035 cur++;
1036 while (*cur && *cur != '\'')
1037 cur++;
1038 } else {
1039 cur++;
1040 }
1041 }
1042 }
1043 } else {
1044 cur++;
1045 }
1046 }
1047 }
1048
1049 /* clean up any attribute name from a premature termination */
1050 g_free(name);
1051
1052 if (found) {
1053 *attributes = attribs;
1054 } else {
1055 *start = NULL;
1056 *end = NULL;
1057 *attributes = NULL;
1058 }
1059
1060 return found;
1061 }
1062
1063 gboolean
1064 gaim_markup_extract_info_field(const char *str, int len, GaimNotifyUserInfo *user_info,
1065 const char *start_token, int skip,
1066 const char *end_token, char check_value,
1067 const char *no_value_token,
1068 const char *display_name, gboolean is_link,
1069 const char *link_prefix,
1070 GaimInfoFieldFormatCallback format_cb)
1071 {
1072 const char *p, *q;
1073
1074 g_return_val_if_fail(str != NULL, FALSE);
1075 g_return_val_if_fail(user_info != NULL, FALSE);
1076 g_return_val_if_fail(start_token != NULL, FALSE);
1077 g_return_val_if_fail(end_token != NULL, FALSE);
1078 g_return_val_if_fail(display_name != NULL, FALSE);
1079
1080 p = strstr(str, start_token);
1081
1082 if (p == NULL)
1083 return FALSE;
1084
1085 p += strlen(start_token) + skip;
1086
1087 if (p >= str + len)
1088 return FALSE;
1089
1090 if (check_value != '\0' && *p == check_value)
1091 return FALSE;
1092
1093 q = strstr(p, end_token);
1094
1095 /* Trim leading blanks */
1096 while (*p != '\n' && g_ascii_isspace(*p)) {
1097 p += 1;
1098 }
1099
1100 /* Trim trailing blanks */
1101 while (q > p && g_ascii_isspace(*(q - 1))) {
1102 q -= 1;
1103 }
1104
1105 /* Don't bother with null strings */
1106 if (p == q)
1107 return FALSE;
1108
1109 if (q != NULL && (!no_value_token ||
1110 (no_value_token && strncmp(p, no_value_token,
1111 strlen(no_value_token)))))
1112 {
1113 GString *dest = g_string_new("");
1114
1115 if (is_link)
1116 {
1117 g_string_append(dest, "<a href=\"");
1118
1119 if (link_prefix)
1120 g_string_append(dest, link_prefix);
1121
1122 if (format_cb != NULL)
1123 {
1124 char *reformatted = format_cb(p, q - p);
1125 g_string_append(dest, reformatted);
1126 g_free(reformatted);
1127 }
1128 else
1129 g_string_append_len(dest, p, q - p);
1130 g_string_append(dest, "\">");
1131
1132 if (link_prefix)
1133 g_string_append(dest, link_prefix);
1134
1135 g_string_append_len(dest, p, q - p);
1136 g_string_append(dest, "</a>");
1137 }
1138 else
1139 {
1140 if (format_cb != NULL)
1141 {
1142 char *reformatted = format_cb(p, q - p);
1143 g_string_append(dest, reformatted);
1144 g_free(reformatted);
1145 }
1146 else
1147 g_string_append_len(dest, p, q - p);
1148 }
1149
1150 gaim_notify_user_info_add_pair(user_info, display_name, dest->str);
1151 g_string_free(dest, TRUE);
1152
1153 return TRUE;
1154 }
1155
1156 return FALSE;
1157 }
1158
1159 struct gaim_parse_tag {
1160 char *src_tag;
1161 char *dest_tag;
1162 gboolean ignore;
1163 };
1164
1165 #define ALLOW_TAG_ALT(x, y) if(!g_ascii_strncasecmp(c, "<" x " ", strlen("<" x " "))) { \
1166 const char *o = c + strlen("<" x); \
1167 const char *p = NULL, *q = NULL, *r = NULL; \
1168 GString *innards = g_string_new(""); \
1169 while(o && *o) { \
1170 if(!q && (*o == '\"' || *o == '\'') ) { \
1171 q = o; \
1172 } else if(q) { \
1173 if(*o == *q) { \
1174 char *unescaped = g_strndup(q+1, o-q-1); \
1175 char *escaped = g_markup_escape_text(unescaped, -1); \
1176 g_string_append_printf(innards, "%c%s%c", *q, escaped, *q); \
1177 g_free(unescaped); \
1178 g_free(escaped); \
1179 q = NULL; \
1180 } else if(*c == '\\') { \
1181 o++; \
1182 } \
1183 } else if(*o == '<') { \
1184 r = o; \
1185 } else if(*o == '>') { \
1186 p = o; \
1187 break; \
1188 } else { \
1189 innards = g_string_append_c(innards, *o); \
1190 } \
1191 o++; \
1192 } \
1193 if(p && !r) { \
1194 if(*(p-1) != '/') { \
1195 struct gaim_parse_tag *pt = g_new0(struct gaim_parse_tag, 1); \
1196 pt->src_tag = x; \
1197 pt->dest_tag = y; \
1198 tags = g_list_prepend(tags, pt); \
1199 } \
1200 xhtml = g_string_append(xhtml, "<" y); \
1201 c += strlen("<" x ); \
1202 xhtml = g_string_append(xhtml, innards->str); \
1203 xhtml = g_string_append_c(xhtml, '>'); \
1204 c = p + 1; \
1205 } else { \
1206 xhtml = g_string_append(xhtml, "&lt;"); \
1207 plain = g_string_append_c(plain, '<'); \
1208 c++; \
1209 } \
1210 g_string_free(innards, TRUE); \
1211 continue; \
1212 } \
1213 if(!g_ascii_strncasecmp(c, "<" x, strlen("<" x)) && \
1214 (*(c+strlen("<" x)) == '>' || \
1215 !g_ascii_strncasecmp(c+strlen("<" x), "/>", 2))) { \
1216 xhtml = g_string_append(xhtml, "<" y); \
1217 c += strlen("<" x); \
1218 if(*c != '/') { \
1219 struct gaim_parse_tag *pt = g_new0(struct gaim_parse_tag, 1); \
1220 pt->src_tag = x; \
1221 pt->dest_tag = y; \
1222 tags = g_list_prepend(tags, pt); \
1223 xhtml = g_string_append_c(xhtml, '>'); \
1224 } else { \
1225 xhtml = g_string_append(xhtml, "/>");\
1226 } \
1227 c = strchr(c, '>') + 1; \
1228 continue; \
1229 }
1230 #define ALLOW_TAG(x) ALLOW_TAG_ALT(x, x)
1231 void
1232 gaim_markup_html_to_xhtml(const char *html, char **xhtml_out,
1233 char **plain_out)
1234 {
1235 GString *xhtml = g_string_new("");
1236 GString *plain = g_string_new("");
1237 GList *tags = NULL, *tag;
1238 const char *c = html;
1239
1240 while(c && *c) {
1241 if(*c == '<') {
1242 if(*(c+1) == '/') { /* closing tag */
1243 tag = tags;
1244 while(tag) {
1245 struct gaim_parse_tag *pt = tag->data;
1246 if(!g_ascii_strncasecmp((c+2), pt->src_tag, strlen(pt->src_tag)) && *(c+strlen(pt->src_tag)+2) == '>') {
1247 c += strlen(pt->src_tag) + 3;
1248 break;
1249 }
1250 tag = tag->next;
1251 }
1252 if(tag) {
1253 while(tags) {
1254 struct gaim_parse_tag *pt = tags->data;
1255 g_string_append_printf(xhtml, "</%s>", pt->dest_tag);
1256 if(tags == tag)
1257 break;
1258 tags = g_list_remove(tags, pt);
1259 g_free(pt);
1260 }
1261 g_free(tag->data);
1262 tags = g_list_remove(tags, tag->data);
1263 } else {
1264 /* a closing tag we weren't expecting...
1265 * we'll let it slide, if it's really a tag...if it's
1266 * just a </ we'll escape it properly */
1267 const char *end = c+2;
1268 while(*end && g_ascii_isalpha(*end))
1269 end++;
1270 if(*end == '>') {
1271 c = end+1;
1272 } else {
1273 xhtml = g_string_append(xhtml, "&lt;");
1274 plain = g_string_append_c(plain, '<');
1275 c++;
1276 }
1277 }
1278 } else { /* opening tag */
1279 ALLOW_TAG("a");
1280 ALLOW_TAG("blockquote");
1281 ALLOW_TAG("cite");
1282 ALLOW_TAG("div");
1283 ALLOW_TAG("em");
1284 ALLOW_TAG("h1");
1285 ALLOW_TAG("h2");
1286 ALLOW_TAG("h3");
1287 ALLOW_TAG("h4");
1288 ALLOW_TAG("h5");
1289 ALLOW_TAG("h6");
1290 /* we only allow html to start the message */
1291 if(c == html)
1292 ALLOW_TAG("html");
1293 ALLOW_TAG_ALT("i", "em");
1294 ALLOW_TAG_ALT("italic", "em");
1295 ALLOW_TAG("li");
1296 ALLOW_TAG("ol");
1297 ALLOW_TAG("p");
1298 ALLOW_TAG("pre");
1299 ALLOW_TAG("q");
1300 ALLOW_TAG("span");
1301 ALLOW_TAG("strong");
1302 ALLOW_TAG("ul");
1303
1304 /* we skip <HR> because it's not legal in XHTML-IM. However,
1305 * we still want to send something sensible, so we put a
1306 * linebreak in its place. <BR> also needs special handling
1307 * because putting a </BR> to close it would just be dumb. */
1308 if((!g_ascii_strncasecmp(c, "<br", 3)
1309 || !g_ascii_strncasecmp(c, "<hr", 3))
1310 && (*(c+3) == '>' ||
1311 !g_ascii_strncasecmp(c+3, "/>", 2) ||
1312 !g_ascii_strncasecmp(c+3, " />", 3))) {
1313 c = strchr(c, '>') + 1;
1314 xhtml = g_string_append(xhtml, "<br/>");
1315 if(*c != '\n')
1316 plain = g_string_append_c(plain, '\n');
1317 continue;
1318 }
1319 if(!g_ascii_strncasecmp(c, "<b>", 3) || !g_ascii_strncasecmp(c, "<bold>", strlen("<bold>"))) {
1320 struct gaim_parse_tag *pt = g_new0(struct gaim_parse_tag, 1);
1321 pt->src_tag = *(c+2) == '>' ? "b" : "bold";
1322 pt->dest_tag = "span";
1323 tags = g_list_prepend(tags, pt);
1324 c = strchr(c, '>') + 1;
1325 xhtml = g_string_append(xhtml, "<span style='font-weight: bold;'>");
1326 continue;
1327 }
1328 if(!g_ascii_strncasecmp(c, "<u>", 3) || !g_ascii_strncasecmp(c, "<underline>", strlen("<underline>"))) {
1329 struct gaim_parse_tag *pt = g_new0(struct gaim_parse_tag, 1);
1330 pt->src_tag = *(c+2) == '>' ? "u" : "underline";
1331 pt->dest_tag = "span";
1332 tags = g_list_prepend(tags, pt);
1333 c = strchr(c, '>') + 1;
1334 xhtml = g_string_append(xhtml, "<span style='text-decoration: underline;'>");
1335 continue;
1336 }
1337 if(!g_ascii_strncasecmp(c, "<s>", 3) || !g_ascii_strncasecmp(c, "<strike>", strlen("<strike>"))) {
1338 struct gaim_parse_tag *pt = g_new0(struct gaim_parse_tag, 1);
1339 pt->src_tag = *(c+2) == '>' ? "s" : "strike";
1340 pt->dest_tag = "span";
1341 tags = g_list_prepend(tags, pt);
1342 c = strchr(c, '>') + 1;
1343 xhtml = g_string_append(xhtml, "<span style='text-decoration: line-through;'>");
1344 continue;
1345 }
1346 if(!g_ascii_strncasecmp(c, "<sub>", 5)) {
1347 struct gaim_parse_tag *pt = g_new0(struct gaim_parse_tag, 1);
1348 pt->src_tag = "sub";
1349 pt->dest_tag = "span";
1350 tags = g_list_prepend(tags, pt);
1351 c = strchr(c, '>') + 1;
1352 xhtml = g_string_append(xhtml, "<span style='vertical-align:sub;'>");
1353 continue;
1354 }
1355 if(!g_ascii_strncasecmp(c, "<sup>", 5)) {
1356 struct gaim_parse_tag *pt = g_new0(struct gaim_parse_tag, 1);
1357 pt->src_tag = "sup";
1358 pt->dest_tag = "span";
1359 tags = g_list_prepend(tags, pt);
1360 c = strchr(c, '>') + 1;
1361 xhtml = g_string_append(xhtml, "<span style='vertical-align:super;'>");
1362 continue;
1363 }
1364 if(!g_ascii_strncasecmp(c, "<font", 5) && (*(c+5) == '>' || *(c+5) == ' ')) {
1365 const char *p = c;
1366 GString *style = g_string_new("");
1367 struct gaim_parse_tag *pt;
1368 while(*p && *p != '>') {
1369 if(!g_ascii_strncasecmp(p, "back=", strlen("back="))) {
1370 const char *q = p + strlen("back=");
1371 GString *color = g_string_new("");
1372 if(*q == '\'' || *q == '\"')
1373 q++;
1374 while(*q && *q != '\"' && *q != '\'' && *q != ' ') {
1375 color = g_string_append_c(color, *q);
1376 q++;
1377 }
1378 g_string_append_printf(style, "background: %s; ", color->str);
1379 g_string_free(color, TRUE);
1380 p = q;
1381 } else if(!g_ascii_strncasecmp(p, "color=", strlen("color="))) {
1382 const char *q = p + strlen("color=");
1383 GString *color = g_string_new("");
1384 if(*q == '\'' || *q == '\"')
1385 q++;
1386 while(*q && *q != '\"' && *q != '\'' && *q != ' ') {
1387 color = g_string_append_c(color, *q);
1388 q++;
1389 }
1390 g_string_append_printf(style, "color: %s; ", color->str);
1391 g_string_free(color, TRUE);
1392 p = q;
1393 } else if(!g_ascii_strncasecmp(p, "face=", strlen("face="))) {
1394 const char *q = p + strlen("face=");
1395 gboolean space_allowed = FALSE;
1396 GString *face = g_string_new("");
1397 if(*q == '\'' || *q == '\"') {
1398 space_allowed = TRUE;
1399 q++;
1400 }
1401 while(*q && *q != '\"' && *q != '\'' && (space_allowed || *q != ' ')) {
1402 face = g_string_append_c(face, *q);
1403 q++;
1404 }
1405 g_string_append_printf(style, "font-family: %s; ", g_strstrip(face->str));
1406 g_string_free(face, TRUE);
1407 p = q;
1408 } else if(!g_ascii_strncasecmp(p, "size=", strlen("size="))) {
1409 const char *q = p + strlen("size=");
1410 int sz;
1411 const char *size = "medium";
1412 if(*q == '\'' || *q == '\"')
1413 q++;
1414 sz = atoi(q);
1415 switch (sz)
1416 {
1417 case 1:
1418 size = "xx-small";
1419 break;
1420 case 2:
1421 size = "x-small";
1422 break;
1423 case 3:
1424 size = "small";
1425 break;
1426 case 4:
1427 size = "medium";
1428 break;
1429 case 5:
1430 size = "large";
1431 break;
1432 case 6:
1433 size = "x-large";
1434 break;
1435 case 7:
1436 size = "xx-large";
1437 break;
1438 default:
1439 break;
1440 }
1441 g_string_append_printf(style, "font-size: %s; ", size);
1442 p = q;
1443 }
1444 p++;
1445 }
1446 if ((c = strchr(c, '>')) != NULL)
1447 c++;
1448 else
1449 c = p;
1450 pt = g_new0(struct gaim_parse_tag, 1);
1451 pt->src_tag = "font";
1452 pt->dest_tag = "span";
1453 tags = g_list_prepend(tags, pt);
1454 if(style->len)
1455 g_string_append_printf(xhtml, "<span style='%s'>", g_strstrip(style->str));
1456 else
1457 pt->ignore = TRUE;
1458 g_string_free(style, TRUE);
1459 continue;
1460 }
1461 if(!g_ascii_strncasecmp(c, "<body ", 6)) {
1462 const char *p = c;
1463 gboolean did_something = FALSE;
1464 while(*p && *p != '>') {
1465 if(!g_ascii_strncasecmp(p, "bgcolor=", strlen("bgcolor="))) {
1466 const char *q = p + strlen("bgcolor=");
1467 struct gaim_parse_tag *pt = g_new0(struct gaim_parse_tag, 1);
1468 GString *color = g_string_new("");
1469 if(*q == '\'' || *q == '\"')
1470 q++;
1471 while(*q && *q != '\"' && *q != '\'' && *q != ' ') {
1472 color = g_string_append_c(color, *q);
1473 q++;
1474 }
1475 g_string_append_printf(xhtml, "<span style='background: %s;'>", g_strstrip(color->str));
1476 g_string_free(color, TRUE);
1477 if ((c = strchr(c, '>')) != NULL)
1478 c++;
1479 else
1480 c = p;
1481 pt->src_tag = "body";
1482 pt->dest_tag = "span";
1483 tags = g_list_prepend(tags, pt);
1484 did_something = TRUE;
1485 break;
1486 }
1487 p++;
1488 }
1489 if(did_something) continue;
1490 }
1491 /* this has to come after the special case for bgcolor */
1492 ALLOW_TAG("body");
1493 if(!g_ascii_strncasecmp(c, "<!--", strlen("<!--"))) {
1494 char *p = strstr(c + strlen("<!--"), "-->");
1495 if(p) {
1496 xhtml = g_string_append(xhtml, "<!--");
1497 c += strlen("<!--");
1498 continue;
1499 }
1500 }
1501
1502 xhtml = g_string_append(xhtml, "&lt;");
1503 plain = g_string_append_c(plain, '<');
1504 c++;
1505 }
1506 } else if(*c == '&') {
1507 char buf[7];
1508 const char *pln;
1509 int len;
1510
1511 if ((pln = detect_entity(c, &len)) == NULL) {
1512 len = 1;
1513 g_snprintf(buf, sizeof(buf), "%c", *c);
1514 pln = buf;
1515 }
1516 xhtml = g_string_append_len(xhtml, c, len);
1517 plain = g_string_append(plain, pln);
1518 c += len;
1519 } else {
1520 xhtml = g_string_append_c(xhtml, *c);
1521 plain = g_string_append_c(plain, *c);
1522 c++;
1523 }
1524 }
1525 tag = tags;
1526 while(tag) {
1527 struct gaim_parse_tag *pt = tag->data;
1528 if(!pt->ignore)
1529 g_string_append_printf(xhtml, "</%s>", pt->dest_tag);
1530 tag = tag->next;
1531 }
1532 g_list_free(tags);
1533 if(xhtml_out)
1534 *xhtml_out = g_strdup(xhtml->str);
1535 if(plain_out)
1536 *plain_out = g_strdup(plain->str);
1537 g_string_free(xhtml, TRUE);
1538 g_string_free(plain, TRUE);
1539 }
1540
1541 /* The following are probably reasonable changes:
1542 * - \n should be converted to a normal space
1543 * - in addition to <br>, <p> and <div> etc. should also be converted into \n
1544 * - We want to turn </td>#whitespace<td> sequences into a single tab
1545 * - We want to turn <td> into a single tab (for msn profile "parsing")
1546 * - We want to turn </tr>#whitespace<tr> sequences into a single \n
1547 * - <script>...</script> and <style>...</style> should be completely removed
1548 */
1549
1550 char *
1551 gaim_markup_strip_html(const char *str)
1552 {
1553 int i, j, k, entlen;
1554 gboolean visible = TRUE;
1555 gboolean closing_td_p = FALSE;
1556 gchar *str2;
1557 const gchar *cdata_close_tag = NULL, *ent;
1558 gchar *href = NULL;
1559 int href_st = 0;
1560
1561 if(!str)
1562 return NULL;
1563
1564 str2 = g_strdup(str);
1565
1566 for (i = 0, j = 0; str2[i]; i++)
1567 {
1568 if (str2[i] == '<')
1569 {
1570 if (cdata_close_tag)
1571 {
1572 /* Note: Don't even assume any other tag is a tag in CDATA */
1573 if (strncasecmp(str2 + i, cdata_close_tag,
1574 strlen(cdata_close_tag)) == 0)
1575 {
1576 i += strlen(cdata_close_tag) - 1;
1577 cdata_close_tag = NULL;
1578 }
1579 continue;
1580 }
1581 else if (strncasecmp(str2 + i, "<td", 3) == 0 && closing_td_p)
1582 {
1583 str2[j++] = '\t';
1584 visible = TRUE;
1585 }
1586 else if (strncasecmp(str2 + i, "</td>", 5) == 0)
1587 {
1588 closing_td_p = TRUE;
1589 visible = FALSE;
1590 }
1591 else
1592 {
1593 closing_td_p = FALSE;
1594 visible = TRUE;
1595 }
1596
1597 k = i + 1;
1598
1599 if(g_ascii_isspace(str2[k]))
1600 visible = TRUE;
1601 else if (str2[k])
1602 {
1603 /* Scan until we end the tag either implicitly (closed start
1604 * tag) or explicitly, using a sloppy method (i.e., < or >
1605 * inside quoted attributes will screw us up)
1606 */
1607 while (str2[k] && str2[k] != '<' && str2[k] != '>')
1608 {
1609 k++;
1610 }
1611
1612 /* If we've got an <a> tag with an href, save the address
1613 * to print later. */
1614 if (strncasecmp(str2 + i, "<a", 2) == 0 &&
1615 g_ascii_isspace(str2[i+2]))
1616 {
1617 int st; /* start of href, inclusive [ */
1618 int end; /* end of href, exclusive ) */
1619 char delim = ' ';
1620 /* Find start of href */
1621 for (st = i + 3; st < k; st++)
1622 {
1623 if (strncasecmp(str2+st, "href=", 5) == 0)
1624 {
1625 st += 5;
1626 if (str2[st] == '"')
1627 {
1628 delim = '"';
1629 st++;
1630 }
1631 break;
1632 }
1633 }
1634 /* find end of address */
1635 for (end = st; end < k && str2[end] != delim; end++)
1636 {
1637 /* All the work is done in the loop construct above. */
1638 }
1639
1640 /* If there's an address, save it. If there was
1641 * already one saved, kill it. */
1642 if (st < k)
1643 {
1644 char *tmp;
1645 g_free(href);
1646 tmp = g_strndup(str2 + st, end - st);
1647 href = gaim_unescape_html(tmp);
1648 g_free(tmp);
1649 href_st = j;
1650 }
1651 }
1652
1653 /* Replace </a> with an ascii representation of the
1654 * address the link was pointing to. */
1655 else if (href != NULL && strncasecmp(str2 + i, "</a>", 4) == 0)
1656 {
1657
1658 size_t hrlen = strlen(href);
1659
1660 /* Only insert the href if it's different from the CDATA. */
1661 if ((hrlen != j - href_st ||
1662 strncmp(str2 + href_st, href, hrlen)) &&
1663 (hrlen != j - href_st + 7 || /* 7 == strlen("http://") */
1664 strncmp(str2 + href_st, href + 7, hrlen - 7)))
1665 {
1666 str2[j++] = ' ';
1667 str2[j++] = '(';
1668 g_memmove(str2 + j, href, hrlen);
1669 j += hrlen;
1670 str2[j++] = ')';
1671 g_free(href);
1672 href = NULL;
1673 }
1674 }
1675
1676 /* Check for tags which should be mapped to newline */
1677 else if (strncasecmp(str2 + i, "<p>", 3) == 0
1678 || strncasecmp(str2 + i, "<tr", 3) == 0
1679 || strncasecmp(str2 + i, "<br", 3) == 0
1680 || strncasecmp(str2 + i, "<li", 3) == 0
1681 || strncasecmp(str2 + i, "<div", 4) == 0
1682 || strncasecmp(str2 + i, "</table>", 8) == 0)
1683 {
1684 str2[j++] = '\n';
1685 }
1686 /* Check for tags which begin CDATA and need to be closed */
1687 #if 0 /* FIXME.. option is end tag optional, we can't handle this right now */
1688 else if (strncasecmp(str2 + i, "<option", 7) == 0)
1689 {
1690 /* FIXME: We should not do this if the OPTION is SELECT'd */
1691 cdata_close_tag = "</option>";
1692 }
1693 #endif
1694 else if (strncasecmp(str2 + i, "<script", 7) == 0)
1695 {
1696 cdata_close_tag = "</script>";
1697 }
1698 else if (strncasecmp(str2 + i, "<style", 6) == 0)
1699 {
1700 cdata_close_tag = "</style>";
1701 }
1702 /* Update the index and continue checking after the tag */
1703 i = (str2[k] == '<' || str2[k] == '\0')? k - 1: k;
1704 continue;
1705 }
1706 }
1707 else if (cdata_close_tag)
1708 {
1709 continue;
1710 }
1711 else if (!g_ascii_isspace(str2[i]))
1712 {
1713 visible = TRUE;
1714 }
1715
1716 if (str2[i] == '&' && (ent = detect_entity(str2 + i, &entlen)) != NULL)
1717 {
1718 while (*ent)
1719 str2[j++] = *ent++;
1720 i += entlen - 1;
1721 continue;
1722 }
1723
1724 if (visible)
1725 str2[j++] = g_ascii_isspace(str2[i])? ' ': str2[i];
1726 }
1727
1728 g_free(href);
1729
1730 str2[j] = '\0';
1731
1732 return str2;
1733 }
1734
1735 static gboolean
1736 badchar(char c)
1737 {
1738 switch (c) {
1739 case ' ':
1740 case ',':
1741 case '\0':
1742 case '\n':
1743 case '\r':
1744 case '<':
1745 case '>':
1746 case '"':
1747 case '\'':
1748 return TRUE;
1749 default:
1750 return FALSE;
1751 }
1752 }
1753
1754 static gboolean
1755 badentity(const char *c)
1756 {
1757 if (!g_ascii_strncasecmp(c, "&lt;", 4) ||
1758 !g_ascii_strncasecmp(c, "&gt;", 4) ||
1759 !g_ascii_strncasecmp(c, "&quot;", 6)) {
1760 return TRUE;
1761 }
1762 return FALSE;
1763 }
1764
1765 char *
1766 gaim_markup_linkify(const char *text)
1767 {
1768 const char *c, *t, *q = NULL;
1769 char *tmpurlbuf, *url_buf;
1770 gunichar g;
1771 gboolean inside_html = FALSE;
1772 int inside_paren = 0;
1773 GString *ret = g_string_new("");
1774 /* Assumes you have a buffer able to carry at least BUF_LEN * 2 bytes */
1775
1776 c = text;
1777 while (*c) {
1778
1779 if(*c == '(' && !inside_html) {
1780 inside_paren++;
1781 ret = g_string_append_c(ret, *c);
1782 c++;
1783 }
1784
1785 if(inside_html) {
1786 if(*c == '>') {
1787 inside_html = FALSE;
1788 } else if(!q && (*c == '\"' || *c == '\'')) {
1789 q = c;
1790 } else if(q) {
1791 if(*c == *q)
1792 q = NULL;
1793 }
1794 } else if(*c == '<') {
1795 inside_html = TRUE;
1796 if (!g_ascii_strncasecmp(c, "<A", 2)) {
1797 while (1) {
1798 if (!g_ascii_strncasecmp(c, "/A>", 3)) {
1799 inside_html = FALSE;
1800 break;
1801 }
1802 ret = g_string_append_c(ret, *c);
1803 c++;
1804 if (!(*c))
1805 break;
1806 }
1807 }
1808 } else if ((*c=='h') && (!g_ascii_strncasecmp(c, "http://", 7) ||
1809 (!g_ascii_strncasecmp(c, "https://", 8)))) {
1810 t = c;
1811 while (1) {
1812 if (badchar(*t) || badentity(t)) {
1813
1814 if (*(t) == ',' && (*(t + 1) != ' ')) {
1815 t++;
1816 continue;
1817 }
1818
1819 if (*(t - 1) == '.')
1820 t--;
1821 if ((*(t - 1) == ')' && (inside_paren > 0))) {
1822 t--;
1823 }
1824
1825 url_buf = g_strndup(c, t - c);
1826 tmpurlbuf = gaim_unescape_html(url_buf);
1827 g_string_append_printf(ret, "<A HREF=\"%s\">%s</A>",
1828 tmpurlbuf, url_buf);
1829 g_free(url_buf);
1830 g_free(tmpurlbuf);
1831 c = t;
1832 break;
1833 }
1834 t++;
1835
1836 }
1837 } else if (!g_ascii_strncasecmp(c, "www.", 4) && (c == text || badchar(c[-1]) || badentity(c-1))) {
1838 if (c[4] != '.') {
1839 t = c;
1840 while (1) {
1841 if (badchar(*t) || badentity(t)) {
1842 if (t - c == 4) {
1843 break;
1844 }
1845
1846 if (*(t) == ',' && (*(t + 1) != ' ')) {
1847 t++;
1848 continue;
1849 }
1850
1851 if (*(t - 1) == '.')
1852 t--;
1853 if ((*(t - 1) == ')' && (inside_paren > 0))) {
1854 t--;
1855 }
1856 url_buf = g_strndup(c, t - c);
1857 tmpurlbuf = gaim_unescape_html(url_buf);
1858 g_string_append_printf(ret,
1859 "<A HREF=\"http://%s\">%s</A>", tmpurlbuf,
1860 url_buf);
1861 g_free(url_buf);
1862 g_free(tmpurlbuf);
1863 c = t;
1864 break;
1865 }
1866 t++;
1867 }
1868 }
1869 } else if (!g_ascii_strncasecmp(c, "ftp://", 6) || !g_ascii_strncasecmp(c, "sftp://", 7)) {
1870 t = c;
1871 while (1) {
1872 if (badchar(*t) || badentity(t)) {
1873 if (*(t - 1) == '.')
1874 t--;
1875 if ((*(t - 1) == ')' && (inside_paren > 0))) {
1876 t--;
1877 }
1878 url_buf = g_strndup(c, t - c);
1879 tmpurlbuf = gaim_unescape_html(url_buf);
1880 g_string_append_printf(ret, "<A HREF=\"%s\">%s</A>",
1881 tmpurlbuf, url_buf);
1882 g_free(url_buf);
1883 g_free(tmpurlbuf);
1884 c = t;
1885 break;
1886 }
1887 if (!t)
1888 break;
1889 t++;
1890
1891 }
1892 } else if (!g_ascii_strncasecmp(c, "ftp.", 4) && (c == text || badchar(c[-1]) || badentity(c-1))) {
1893 if (c[4] != '.') {
1894 t = c;
1895 while (1) {
1896 if (badchar(*t) || badentity(t)) {
1897 if (t - c == 4) {
1898 break;
1899 }
1900 if (*(t - 1) == '.')
1901 t--;
1902 if ((*(t - 1) == ')' && (inside_paren > 0))) {
1903 t--;
1904 }
1905 url_buf = g_strndup(c, t - c);
1906 tmpurlbuf = gaim_unescape_html(url_buf);
1907 g_string_append_printf(ret,
1908 "<A HREF=\"ftp://%s\">%s</A>", tmpurlbuf,
1909 url_buf);
1910 g_free(url_buf);
1911 g_free(tmpurlbuf);
1912 c = t;
1913 break;
1914 }
1915 if (!t)
1916 break;
1917 t++;
1918 }
1919 }
1920 } else if (!g_ascii_strncasecmp(c, "mailto:", 7)) {
1921 t = c;
1922 while (1) {
1923 if (badchar(*t) || badentity(t)) {
1924 if (*(t - 1) == '.')
1925 t--;
1926 url_buf = g_strndup(c, t - c);
1927 tmpurlbuf = gaim_unescape_html(url_buf);
1928 g_string_append_printf(ret, "<A HREF=\"%s\">%s</A>",
1929 tmpurlbuf, url_buf);
1930 g_free(url_buf);
1931 g_free(tmpurlbuf);
1932 c = t;
1933 break;
1934 }
1935 if (!t)
1936 break;
1937 t++;
1938
1939 }
1940 } else if (c != text && (*c == '@')) {
1941 int flag;
1942 GString *gurl_buf = NULL;
1943 const char illegal_chars[] = "!@#$%^&*()[]{}/|\\<>\":;\r\n \0";
1944
1945 if (strchr(illegal_chars,*(c - 1)) || strchr(illegal_chars, *(c + 1)))
1946 flag = 0;
1947 else {
1948 flag = 1;
1949 gurl_buf = g_string_new("");
1950 }
1951
1952 t = c;
1953 while (flag) {
1954 /* iterate backwards grabbing the local part of an email address */
1955 g = g_utf8_get_char(t);
1956 if (badchar(*t) || (g >= 127) || (*t == '(') ||
1957 ((*t == ';') && ((t > (text+2) && (!g_ascii_strncasecmp(t - 3, "&lt;", 4) ||
1958 !g_ascii_strncasecmp(t - 3, "&gt;", 4))) ||
1959 (t > (text+4) && (!g_ascii_strncasecmp(t - 5, "&quot;", 6)))))) {
1960 /* local part will already be part of ret, strip it out */
1961 ret = g_string_truncate(ret, ret->len - (c - t));
1962 ret = g_string_append_unichar(ret, g);
1963 break;
1964 } else {
1965 g_string_prepend_unichar(gurl_buf, g);
1966 t = g_utf8_find_prev_char(text, t);
1967 if (t < text) {
1968 ret = g_string_assign(ret, "");
1969 break;
1970 }
1971 }
1972 }
1973
1974 t = g_utf8_find_next_char(c, NULL);
1975
1976 while (flag) {
1977 /* iterate forwards grabbing the domain part of an email address */
1978 g = g_utf8_get_char(t);
1979 if (badchar(*t) || (g >= 127) || (*t == ')') || badentity(t)) {
1980 char *d;
1981
1982 url_buf = g_string_free(gurl_buf, FALSE);
1983
1984 /* strip off trailing periods */
1985 if (strlen(url_buf) > 0) {
1986 for (d = url_buf + strlen(url_buf) - 1; *d == '.'; d--, t--)
1987 *d = '\0';
1988 }
1989
1990 tmpurlbuf = gaim_unescape_html(url_buf);
1991 if (gaim_email_is_valid(tmpurlbuf)) {
1992 g_string_append_printf(ret, "<A HREF=\"mailto:%s\">%s</A>",
1993 tmpurlbuf, url_buf);
1994 } else {
1995 g_string_append(ret, url_buf);
1996 }
1997 g_free(url_buf);
1998 g_free(tmpurlbuf);
1999 c = t;
2000
2001 break;
2002 } else {
2003 g_string_append_unichar(gurl_buf, g);
2004 t = g_utf8_find_next_char(t, NULL);
2005 }
2006 }
2007 }
2008
2009 if(*c == ')' && !inside_html) {
2010 inside_paren--;
2011 ret = g_string_append_c(ret, *c);
2012 c++;
2013 }
2014
2015 if (*c == 0)
2016 break;
2017
2018 ret = g_string_append_c(ret, *c);
2019 c++;
2020
2021 }
2022 return g_string_free(ret, FALSE);
2023 }
2024
2025 char *
2026 gaim_unescape_html(const char *html) {
2027 if (html != NULL) {
2028 const char *c = html;
2029 GString *ret = g_string_new("");
2030 while (*c) {
2031 int len;
2032 const char *ent;
2033
2034 if ((ent = detect_entity(c, &len)) != NULL) {
2035 ret = g_string_append(ret, ent);
2036 c += len;
2037 } else if (!strncmp(c, "<br>", 4)) {
2038 ret = g_string_append_c(ret, '\n');
2039 c += 4;
2040 } else {
2041 ret = g_string_append_c(ret, *c);
2042 c++;
2043 }
2044 }
2045 return g_string_free(ret, FALSE);
2046 }
2047
2048 return NULL;
2049 }
2050
2051 char *
2052 gaim_markup_slice(const char *str, guint x, guint y)
2053 {
2054 GString *ret;
2055 GQueue *q;
2056 guint z = 0;
2057 gboolean appended = FALSE;
2058 gunichar c;
2059 char *tag;
2060
2061 g_return_val_if_fail(x <= y, NULL);
2062
2063 if (x == y)
2064 return g_strdup("");
2065
2066 ret = g_string_new("");
2067 q = g_queue_new();
2068
2069 while (*str && (z < y)) {
2070 c = g_utf8_get_char(str);
2071
2072 if (c == '<') {
2073 char *end = strchr(str, '>');
2074
2075 if (!end) {
2076 g_string_free(ret, TRUE);
2077 while ((tag = g_queue_pop_head(q)))
2078 g_free(tag);
2079 g_queue_free(q);
2080 return NULL;
2081 }
2082
2083 if (!g_ascii_strncasecmp(str, "<img ", 5)) {
2084 z += strlen("[Image]");
2085 } else if (!g_ascii_strncasecmp(str, "<br", 3)) {
2086 z += 1;
2087 } else if (!g_ascii_strncasecmp(str, "<hr>", 4)) {
2088 z += strlen("\n---\n");
2089 } else if (!g_ascii_strncasecmp(str, "</", 2)) {
2090 /* pop stack */
2091 char *tmp;
2092
2093 tmp = g_queue_pop_head(q);
2094 g_free(tmp);
2095 /* z += 0; */
2096 } else {
2097 /* push it unto the stack */
2098 char *tmp;
2099
2100 tmp = g_strndup(str, end - str + 1);
2101 g_queue_push_head(q, tmp);
2102 /* z += 0; */
2103 }
2104
2105 if (z >= x) {
2106 g_string_append_len(ret, str, end - str + 1);
2107 }
2108
2109 str = end;
2110 } else if (c == '&') {
2111 char *end = strchr(str, ';');
2112 if (!end) {
2113 g_string_free(ret, TRUE);
2114 while ((tag = g_queue_pop_head(q)))
2115 g_free(tag);
2116 g_queue_free(q);
2117
2118 return NULL;
2119 }
2120
2121 if (z >= x)
2122 g_string_append_len(ret, str, end - str + 1);
2123
2124 z++;
2125 str = end;
2126 } else {
2127 if (z == x && z > 0 && !appended) {
2128 GList *l = q->tail;
2129
2130 while (l) {
2131 tag = l->data;
2132 g_string_append(ret, tag);
2133 l = l->prev;
2134 }
2135 appended = TRUE;
2136 }
2137
2138 if (z >= x)
2139 g_string_append_unichar(ret, c);
2140 z++;
2141 }
2142
2143 str = g_utf8_next_char(str);
2144 }
2145
2146 while ((tag = g_queue_pop_head(q))) {
2147 char *name;
2148
2149 name = gaim_markup_get_tag_name(tag);
2150 g_string_append_printf(ret, "</%s>", name);
2151 g_free(name);
2152 g_free(tag);
2153 }
2154
2155 g_queue_free(q);
2156 return g_string_free(ret, FALSE);
2157 }
2158
2159 char *
2160 gaim_markup_get_tag_name(const char *tag)
2161 {
2162 int i;
2163 g_return_val_if_fail(tag != NULL, NULL);
2164 g_return_val_if_fail(*tag == '<', NULL);
2165
2166 for (i = 1; tag[i]; i++)
2167 if (tag[i] == '>' || tag[i] == ' ' || tag[i] == '/')
2168 break;
2169
2170 return g_strndup(tag+1, i-1);
2171 }
2172
2173 /**************************************************************************
2174 * Path/Filename Functions
2175 **************************************************************************/
2176 const char *
2177 gaim_home_dir(void)
2178 {
2179 #ifndef _WIN32
2180 return g_get_home_dir();
2181 #else
2182 return wgaim_data_dir();
2183 #endif
2184 }
2185
2186 /* returns a string of the form ~/.gaim, where ~ is replaced by the user's home
2187 * dir. Note that there is no trailing slash after .gaim. */
2188 const char *
2189 gaim_user_dir(void)
2190 {
2191 if (custom_home_dir != NULL && strlen(custom_home_dir) > 0) {
2192 strcpy ((char*) &home_dir, (char*) &custom_home_dir);
2193 } else {
2194 const gchar *hd = gaim_home_dir();
2195
2196 if (hd) {
2197 g_strlcpy((char*) &home_dir, hd, sizeof(home_dir));
2198 g_strlcat((char*) &home_dir, G_DIR_SEPARATOR_S ".gaim",
2199 sizeof(home_dir));
2200 }
2201 }
2202
2203 return home_dir;
2204 }
2205
2206 void gaim_util_set_user_dir(const char *dir)
2207 {
2208 if (dir != NULL && strlen(dir) > 0) {
2209 g_strlcpy((char*) &custom_home_dir, dir,
2210 sizeof(custom_home_dir));
2211 }
2212 }
2213
2214 int gaim_build_dir (const char *path, int mode)
2215 {
2216 #if GLIB_CHECK_VERSION(2,8,0)
2217 return g_mkdir_with_parents(path, mode);
2218 #else
2219 char *dir, **components, delim[] = { G_DIR_SEPARATOR, '\0' };
2220 int cur, len;
2221
2222 g_return_val_if_fail(path != NULL, -1);
2223
2224 dir = g_new0(char, strlen(path) + 1);
2225 components = g_strsplit(path, delim, -1);
2226 len = 0;
2227 for (cur = 0; components[cur] != NULL; cur++) {
2228 /* If you don't know what you're doing on both
2229 * win32 and *NIX, stay the hell away from this code */
2230 if(cur > 1)
2231 dir[len++] = G_DIR_SEPARATOR;
2232 strcpy(dir + len, components[cur]);
2233 len += strlen(components[cur]);
2234 if(cur == 0)
2235 dir[len++] = G_DIR_SEPARATOR;
2236
2237 if(g_file_test(dir, G_FILE_TEST_IS_DIR)) {
2238 continue;
2239 #ifdef _WIN32
2240 /* allow us to create subdirs on UNC paths
2241 * (\\machinename\path\to\blah)
2242 * g_file_test() doesn't work on "\\machinename" */
2243 } else if (cur == 2 && dir[0] == '\\' && dir[1] == '\\'
2244 && components[cur + 1] != NULL) {
2245 continue;
2246 #endif
2247 } else if(g_file_test(dir, G_FILE_TEST_EXISTS)) {
2248 gaim_debug_warning("build_dir", "bad path: %s\n", path);
2249 g_strfreev(components);
2250 g_free(dir);
2251 return -1;
2252 }
2253
2254 if (g_mkdir(dir, mode) < 0) {
2255 gaim_debug_warning("build_dir", "mkdir: %s\n", strerror(errno));
2256 g_strfreev(components);
2257 g_free(dir);
2258 return -1;
2259 }
2260 }
2261
2262 g_strfreev(components);
2263 g_free(dir);
2264 return 0;
2265 #endif
2266 }
2267
2268 /*
2269 * This function is long and beautiful, like my--um, yeah. Anyway,
2270 * it includes lots of error checking so as we don't overwrite
2271 * people's settings if there is a problem writing the new values.
2272 */
2273 gboolean
2274 gaim_util_write_data_to_file(const char *filename, const char *data, size_t size)
2275 {
2276 const char *user_dir = gaim_user_dir();
2277 gchar *filename_temp, *filename_full;
2278 FILE *file;
2279 size_t real_size, byteswritten;
2280 struct stat st;
2281
2282 g_return_val_if_fail(user_dir != NULL, FALSE);
2283
2284 gaim_debug_info("util", "Writing file %s to directory %s\n",
2285 filename, user_dir);
2286
2287 /* Ensure the user directory exists */
2288 if (!g_file_test(user_dir, G_FILE_TEST_IS_DIR))
2289 {
2290 if (g_mkdir(user_dir, S_IRUSR | S_IWUSR | S_IXUSR) == -1)
2291 {
2292 gaim_debug_error("util", "Error creating directory %s: %s\n",
2293 user_dir, strerror(errno));
2294 return FALSE;
2295 }
2296 }
2297
2298 filename_full = g_strdup_printf("%s" G_DIR_SEPARATOR_S "%s", user_dir, filename);
2299 filename_temp = g_strdup_printf("%s.save", filename_full);
2300
2301 /* Remove an old temporary file, if one exists */
2302 if (g_file_test(filename_temp, G_FILE_TEST_EXISTS))
2303 {
2304 if (g_unlink(filename_temp) == -1)
2305 {
2306 gaim_debug_error("util", "Error removing old file %s: %s\n",
2307 filename_temp, strerror(errno));
2308 }
2309 }
2310
2311 /* Open file */
2312 file = g_fopen(filename_temp, "wb");
2313 if (file == NULL)
2314 {
2315 gaim_debug_error("util", "Error opening file %s for writing: %s\n",
2316 filename_temp, strerror(errno));
2317 g_free(filename_full);
2318 g_free(filename_temp);
2319 return FALSE;
2320 }
2321
2322 /* Write to file */
2323 real_size = (size == -1) ? strlen(data) : size;
2324 byteswritten = fwrite(data, 1, real_size, file);
2325
2326 /* Close file */
2327 if (fclose(file) != 0)
2328 {
2329 gaim_debug_error("util", "Error closing file %s: %s\n",
2330 filename_temp, strerror(errno));
2331 g_free(filename_full);
2332 g_free(filename_temp);
2333 return FALSE;
2334 }
2335
2336 /* Ensure the file is the correct size */
2337 if (byteswritten != real_size)
2338 {
2339 gaim_debug_error("util", "Error writing to file %s: Wrote %" G_GSIZE_FORMAT " bytes "
2340 "but should have written %" G_GSIZE_FORMAT "; is your disk full?\n",
2341 filename_temp, byteswritten, real_size);
2342 g_free(filename_full);
2343 g_free(filename_temp);
2344 return FALSE;
2345 }
2346 /* Use stat to be absolutely sure. */
2347 if ((g_stat(filename_temp, &st) == -1) || (st.st_size != real_size))
2348 {
2349 gaim_debug_error("util", "Error writing data to file %s: "
2350 "Incomplete file written; is your disk full?\n",
2351 filename_temp);
2352 g_free(filename_full);
2353 g_free(filename_temp);
2354 return FALSE;
2355 }
2356
2357 #ifndef _WIN32
2358 /* Set file permissions */
2359 if (chmod(filename_temp, S_IRUSR | S_IWUSR) == -1)
2360 {
2361 gaim_debug_error("util", "Error setting permissions of file %s: %s\n",
2362 filename_temp, strerror(errno));
2363 }
2364 #endif
2365
2366 /* Rename to the REAL name */
2367 if (g_rename(filename_temp, filename_full) == -1)
2368 {
2369 gaim_debug_error("util", "Error renaming %s to %s: %s\n",
2370 filename_temp, filename_full, strerror(errno));
2371 }
2372
2373 g_free(filename_full);
2374 g_free(filename_temp);
2375
2376 return TRUE;
2377 }
2378
2379 xmlnode *
2380 gaim_util_read_xml_from_file(const char *filename, const char *description)
2381 {
2382 const char *user_dir = gaim_user_dir();
2383 gchar *filename_full;
2384 GError *error = NULL;
2385 gchar *contents = NULL;
2386 gsize length;
2387 xmlnode *node = NULL;
2388
2389 g_return_val_if_fail(user_dir != NULL, NULL);
2390
2391 gaim_debug_info("util", "Reading file %s from directory %s\n",
2392 filename, user_dir);
2393
2394 filename_full = g_build_filename(user_dir, filename, NULL);
2395
2396 if (!g_file_test(filename_full, G_FILE_TEST_EXISTS))
2397 {
2398 gaim_debug_info("util", "File %s does not exist (this is not "
2399 "necessarily an error)\n", filename_full);
2400 g_free(filename_full);
2401 return NULL;
2402 }
2403
2404 if (!g_file_get_contents(filename_full, &contents, &length, &error))
2405 {
2406 gaim_debug_error("util", "Error reading file %s: %s\n",
2407 filename_full, error->message);
2408 g_error_free(error);
2409 }
2410
2411 if ((contents != NULL) && (length > 0))
2412 {
2413 node = xmlnode_from_str(contents, length);
2414
2415 /* If we were unable to parse the file then save its contents to a backup file */
2416 if (node == NULL)
2417 {
2418 gchar *filename_temp;
2419
2420 filename_temp = g_strdup_printf("%s~", filename);
2421 gaim_debug_error("util", "Error parsing file %s. Renaming old "
2422 "file to %s\n", filename_full, filename_temp);
2423 gaim_util_write_data_to_file(filename_temp, contents, length);
2424 g_free(filename_temp);
2425 }
2426
2427 g_free(contents);
2428 }
2429
2430 /* If we could not parse the file then show the user an error message */
2431 if (node == NULL)
2432 {
2433 gchar *title, *msg;
2434 title = g_strdup_printf(_("Error Reading %s"), filename);
2435 msg = g_strdup_printf(_("An error was encountered reading your "
2436 "%s. They have not been loaded, and the old file "
2437 "has been renamed to %s~."), description, filename_full);
2438 gaim_notify_error(NULL, NULL, title, msg);
2439 g_free(title);
2440 g_free(msg);
2441 }
2442
2443 g_free(filename_full);
2444
2445 return node;
2446 }
2447
2448 /*
2449 * Like mkstemp() but returns a file pointer, uses a pre-set template,
2450 * uses the semantics of tempnam() for the directory to use and allocates
2451 * the space for the filepath.
2452 *
2453 * Caller is responsible for closing the file and removing it when done,
2454 * as well as freeing the space pointed-to by "path" with g_free().
2455 *
2456 * Returns NULL on failure and cleans up after itself if so.
2457 */
2458 static const char *gaim_mkstemp_templ = {"gaimXXXXXX"};
2459
2460 FILE *
2461 gaim_mkstemp(char **fpath, gboolean binary)
2462 {
2463 const gchar *tmpdir;
2464 #ifndef _WIN32
2465 int fd;
2466 #endif
2467 FILE *fp = NULL;
2468
2469 g_return_val_if_fail(fpath != NULL, NULL);
2470
2471 if((tmpdir = (gchar*)g_get_tmp_dir()) != NULL) {
2472 if((*fpath = g_strdup_printf("%s" G_DIR_SEPARATOR_S "%s", tmpdir, gaim_mkstemp_templ)) != NULL) {
2473 #ifdef _WIN32
2474 char* result = _mktemp( *fpath );
2475 if( result == NULL )
2476 gaim_debug(GAIM_DEBUG_ERROR, "gaim_mkstemp",
2477 "Problem creating the template\n");
2478 else
2479 {
2480 if( (fp = g_fopen( result, binary?"wb+":"w+")) == NULL ) {
2481 gaim_debug(GAIM_DEBUG_ERROR, "gaim_mkstemp",
2482 "Couldn't fopen() %s\n", result);
2483 }
2484 }
2485 #else
2486 if((fd = mkstemp(*fpath)) == -1) {
2487 gaim_debug(GAIM_DEBUG_ERROR, "gaim_mkstemp",
2488 "Couldn't make \"%s\", error: %d\n",
2489 *fpath, errno);
2490 } else {
2491 if((fp = fdopen(fd, "r+")) == NULL) {
2492 close(fd);
2493 gaim_debug(GAIM_DEBUG_ERROR, "gaim_mkstemp",
2494 "Couldn't fdopen(), error: %d\n", errno);
2495 }
2496 }
2497 #endif
2498 if(!fp) {
2499 g_free(*fpath);
2500 *fpath = NULL;
2501 }
2502 }
2503 } else {
2504 gaim_debug(GAIM_DEBUG_ERROR, "gaim_mkstemp",
2505 "g_get_tmp_dir() failed!\n");
2506 }
2507
2508 return fp;
2509 }
2510
2511 gboolean
2512 gaim_program_is_valid(const char *program)
2513 {
2514 GError *error = NULL;
2515 char **argv;
2516 gchar *progname;
2517 gboolean is_valid = FALSE;
2518
2519 g_return_val_if_fail(program != NULL, FALSE);
2520 g_return_val_if_fail(*program != '\0', FALSE);
2521
2522 if (!g_shell_parse_argv(program, NULL, &argv, &error)) {
2523 gaim_debug(GAIM_DEBUG_ERROR, "program_is_valid",
2524 "Could not parse program '%s': %s\n",
2525 program, error->message);
2526 g_error_free(error);
2527 return FALSE;
2528 }
2529
2530 if (argv == NULL) {
2531 return FALSE;
2532 }
2533
2534 progname = g_find_program_in_path(argv[0]);
2535 is_valid = (progname != NULL);
2536
2537 g_strfreev(argv);
2538 g_free(progname);
2539
2540 return is_valid;
2541 }
2542
2543
2544 gboolean
2545 gaim_running_gnome(void)
2546 {
2547 #ifndef _WIN32
2548 gchar *tmp = g_find_program_in_path("gnome-open");
2549
2550 if (tmp == NULL)
2551 return FALSE;
2552 g_free(tmp);
2553
2554 return (g_getenv("GNOME_DESKTOP_SESSION_ID") != NULL);
2555 #else
2556 return FALSE;
2557 #endif
2558 }
2559
2560 gboolean
2561 gaim_running_kde(void)
2562 {
2563 #ifndef _WIN32
2564 gchar *tmp = g_find_program_in_path("kfmclient");
2565 const char *session;
2566
2567 if (tmp == NULL)
2568 return FALSE;
2569 g_free(tmp);
2570
2571 session = g_getenv("KDE_FULL_SESSION");
2572 if (session != NULL && !strcmp(session, "true"))
2573 return TRUE;
2574
2575 /* If you run Gaim from Konsole under !KDE, this will provide a
2576 * a false positive. Since we do the GNOME checks first, this is
2577 * only a problem if you're running something !(KDE || GNOME) and
2578 * you run Gaim from Konsole. This really shouldn't be a problem. */
2579 return ((g_getenv("KDEDIR") != NULL) || g_getenv("KDEDIRS") != NULL);
2580 #else
2581 return FALSE;
2582 #endif
2583 }
2584
2585 gboolean
2586 gaim_running_osx(void)
2587 {
2588 #if defined(__APPLE__)
2589 return TRUE;
2590 #else
2591 return FALSE;
2592 #endif
2593 }
2594
2595 char *
2596 gaim_fd_get_ip(int fd)
2597 {
2598 struct sockaddr addr;
2599 socklen_t namelen = sizeof(addr);
2600
2601 g_return_val_if_fail(fd != 0, NULL);
2602
2603 if (getsockname(fd, &addr, &namelen))
2604 return NULL;
2605
2606 return g_strdup(inet_ntoa(((struct sockaddr_in *)&addr)->sin_addr));
2607 }
2608
2609
2610 /**************************************************************************
2611 * String Functions
2612 **************************************************************************/
2613 const char *
2614 gaim_normalize(const GaimAccount *account, const char *str)
2615 {
2616 const char *ret = NULL;
2617
2618 if (account != NULL)
2619 {
2620 GaimPlugin *prpl = gaim_find_prpl(gaim_account_get_protocol_id(account));
2621
2622 if (prpl != NULL)
2623 {
2624 GaimPluginProtocolInfo *prpl_info = GAIM_PLUGIN_PROTOCOL_INFO(prpl);
2625
2626 if(prpl_info && prpl_info->normalize)
2627 ret = prpl_info->normalize(account, str);
2628 }
2629 }
2630
2631 if (ret == NULL)
2632 {
2633 static char buf[BUF_LEN];
2634 char *tmp;
2635
2636 tmp = g_utf8_normalize(str, -1, G_NORMALIZE_DEFAULT);
2637 g_snprintf(buf, sizeof(buf), "%s", tmp);
2638 g_free(tmp);
2639
2640 ret = buf;
2641 }
2642
2643 return ret;
2644 }
2645
2646 /*
2647 * You probably don't want to call this directly, it is
2648 * mainly for use as a PRPL callback function. See the
2649 * comments in util.h.
2650 */
2651 const char *
2652 gaim_normalize_nocase(const GaimAccount *account, const char *str)
2653 {
2654 static char buf[BUF_LEN];
2655 char *tmp1, *tmp2;
2656
2657 g_return_val_if_fail(str != NULL, NULL);
2658
2659 tmp1 = g_utf8_strdown(str, -1);
2660 tmp2 = g_utf8_normalize(tmp1, -1, G_NORMALIZE_DEFAULT);
2661 g_snprintf(buf, sizeof(buf), "%s", tmp2 ? tmp2 : "");
2662 g_free(tmp2);
2663 g_free(tmp1);
2664
2665 return buf;
2666 }
2667
2668 gchar *
2669 gaim_strdup_withhtml(const gchar *src)
2670 {
2671 gulong destsize, i, j;
2672 gchar *dest;
2673
2674 g_return_val_if_fail(src != NULL, NULL);
2675
2676 /* New length is (length of src) + (number of \n's * 3) - (number of \r's) + 1 */
2677 destsize = 1;
2678 for (i = 0; src[i] != '\0'; i++)
2679 {
2680 if (src[i] == '\n')
2681 destsize += 4;
2682 else if (src[i] != '\r')
2683 destsize++;
2684 }
2685
2686 dest = g_malloc(destsize);
2687
2688 /* Copy stuff, ignoring \r's, because they are dumb */
2689 for (i = 0, j = 0; src[i] != '\0'; i++) {
2690 if (src[i] == '\n') {
2691 strcpy(&dest[j], "<BR>");
2692 j += 4;
2693 } else if (src[i] != '\r')
2694 dest[j++] = src[i];
2695 }
2696
2697 dest[destsize-1] = '\0';
2698
2699 return dest;
2700 }
2701
2702 gboolean
2703 gaim_str_has_prefix(const char *s, const char *p)
2704 {
2705 #if GLIB_CHECK_VERSION(2,2,0)
2706 return g_str_has_prefix(s, p);
2707 #else
2708 g_return_val_if_fail(s != NULL, FALSE);
2709 g_return_val_if_fail(p != NULL, FALSE);
2710
2711 return (!strncmp(s, p, strlen(p)));
2712 #endif
2713 }
2714
2715 gboolean
2716 gaim_str_has_suffix(const char *s, const char *x)
2717 {
2718 #if GLIB_CHECK_VERSION(2,2,0)
2719 return g_str_has_suffix(s, x);
2720 #else
2721 int off;
2722
2723 g_return_val_if_fail(s != NULL, FALSE);
2724 g_return_val_if_fail(x != NULL, FALSE);
2725
2726 off = strlen(s) - strlen(x);
2727 return (off >= 0 && !strcmp(s + off, x));
2728 #endif
2729 }
2730
2731 char *
2732 gaim_str_add_cr(const char *text)
2733 {
2734 char *ret = NULL;
2735 int count = 0, j;
2736 guint i;
2737
2738 g_return_val_if_fail(text != NULL, NULL);
2739
2740 if (text[0] == '\n')
2741 count++;
2742 for (i = 1; i < strlen(text); i++)
2743 if (text[i] == '\n' && text[i - 1] != '\r')
2744 count++;
2745
2746 if (count == 0)
2747 return g_strdup(text);
2748
2749 ret = g_malloc0(strlen(text) + count + 1);
2750
2751 i = 0; j = 0;
2752 if (text[i] == '\n')
2753 ret[j++] = '\r';
2754 ret[j++] = text[i++];
2755 for (; i < strlen(text); i++) {
2756 if (text[i] == '\n' && text[i - 1] != '\r')
2757 ret[j++] = '\r';
2758 ret[j++] = text[i];
2759 }
2760
2761 gaim_debug_misc("gaim_str_add_cr", "got: %s, leaving with %s\n",
2762 text, ret);
2763
2764 return ret;
2765 }
2766
2767 void
2768 gaim_str_strip_char(char *text, char thechar)
2769 {
2770 int i, j;
2771
2772 g_return_if_fail(text != NULL);
2773
2774 for (i = 0, j = 0; text[i]; i++)
2775 if (text[i] != thechar)
2776 text[j++] = text[i];
2777
2778 text[j++] = '\0';
2779 }
2780
2781 void
2782 gaim_util_chrreplace(char *string, char delimiter,
2783 char replacement)
2784 {
2785 int i = 0;
2786
2787 g_return_if_fail(string != NULL);
2788
2789 while (string[i] != '\0')
2790 {
2791 if (string[i] == delimiter)
2792 string[i] = replacement;
2793 i++;
2794 }
2795 }
2796
2797 gchar *
2798 gaim_strreplace(const char *string, const char *delimiter,
2799 const char *replacement)
2800 {
2801 gchar **split;
2802 gchar *ret;
2803
2804 g_return_val_if_fail(string != NULL, NULL);
2805 g_return_val_if_fail(delimiter != NULL, NULL);
2806 g_return_val_if_fail(replacement != NULL, NULL);
2807
2808 split = g_strsplit(string, delimiter, 0);
2809 ret = g_strjoinv(replacement, split);
2810 g_strfreev(split);
2811
2812 return ret;
2813 }
2814
2815 gchar *
2816 gaim_strcasereplace(const char *string, const char *delimiter,
2817 const char *replacement)
2818 {
2819 gchar *ret;
2820 int length_del, length_rep, i, j;
2821
2822 g_return_val_if_fail(string != NULL, NULL);
2823 g_return_val_if_fail(delimiter != NULL, NULL);
2824 g_return_val_if_fail(replacement != NULL, NULL);
2825
2826 length_del = strlen(delimiter);
2827 length_rep = strlen(replacement);
2828
2829 /* Count how many times the delimiter appears */
2830 i = 0; /* position in the source string */
2831 j = 0; /* number of occurrences of "delimiter" */
2832 while (string[i] != '\0') {
2833 if (!strncasecmp(&string[i], delimiter, length_del)) {
2834 i += length_del;
2835 j += length_rep;
2836 } else {
2837 i++;
2838 j++;
2839 }
2840 }
2841
2842 ret = g_malloc(j+1);
2843
2844 i = 0; /* position in the source string */
2845 j = 0; /* position in the destination string */
2846 while (string[i] != '\0') {
2847 if (!strncasecmp(&string[i], delimiter, length_del)) {
2848 strncpy(&ret[j], replacement, length_rep);
2849 i += length_del;
2850 j += length_rep;
2851 } else {
2852 ret[j] = string[i];
2853 i++;
2854 j++;
2855 }
2856 }
2857
2858 ret[j] = '\0';
2859
2860 return ret;
2861 }
2862
2863 const char *
2864 gaim_strcasestr(const char *haystack, const char *needle)
2865 {
2866 size_t hlen, nlen;
2867 const char *tmp, *ret;
2868
2869 g_return_val_if_fail(haystack != NULL, NULL);
2870 g_return_val_if_fail(needle != NULL, NULL);
2871
2872 hlen = strlen(haystack);
2873 nlen = strlen(needle);
2874 tmp = haystack,
2875 ret = NULL;
2876
2877 g_return_val_if_fail(hlen > 0, NULL);
2878 g_return_val_if_fail(nlen > 0, NULL);
2879
2880 while (*tmp && !ret) {
2881 if (!g_ascii_strncasecmp(needle, tmp, nlen))
2882 ret = tmp;
2883 else
2884 tmp++;
2885 }
2886
2887 return ret;
2888 }
2889
2890 char *
2891 gaim_str_size_to_units(size_t size)
2892 {
2893 static const char *size_str[4] = { "bytes", "KB", "MB", "GB" };
2894 float size_mag;
2895 int size_index = 0;
2896
2897 if (size == -1) {
2898 return g_strdup(_("Calculating..."));
2899 }
2900 else if (size == 0) {
2901 return g_strdup(_("Unknown."));
2902 }
2903 else {
2904 size_mag = (float)size;
2905
2906 while ((size_index < 3) && (size_mag > 1024)) {
2907 size_mag /= 1024;
2908 size_index++;
2909 }
2910
2911 if (size_index == 0) {
2912 return g_strdup_printf("%" G_GSIZE_FORMAT " %s", size, size_str[size_index]);
2913 } else {
2914 return g_strdup_printf("%.2f %s", size_mag, size_str[size_index]);
2915 }
2916 }
2917 }
2918
2919 char *
2920 gaim_str_seconds_to_string(guint secs)
2921 {
2922 char *ret = NULL;
2923 guint days, hrs, mins;
2924
2925 if (secs < 60)
2926 {
2927 return g_strdup_printf(ngettext("%d second", "%d seconds", secs), secs);
2928 }
2929
2930 days = secs / (60 * 60 * 24);
2931 secs = secs % (60 * 60 * 24);
2932 hrs = secs / (60 * 60);
2933 secs = secs % (60 * 60);
2934 mins = secs / 60;
2935 secs = secs % 60;
2936
2937 if (days > 0)
2938 {
2939 ret = g_strdup_printf(ngettext("%d day", "%d days", days), days);
2940 }
2941
2942 if (hrs > 0)
2943 {
2944 if (ret != NULL)
2945 {
2946 char *tmp = g_strdup_printf(
2947 ngettext("%s, %d hour", "%s, %d hours", hrs),
2948 ret, hrs);
2949 g_free(ret);
2950 ret = tmp;
2951 }
2952 else
2953 ret = g_strdup_printf(ngettext("%d hour", "%d hours", hrs), hrs);
2954 }
2955
2956 if (mins > 0)
2957 {
2958 if (ret != NULL)
2959 {
2960 char *tmp = g_strdup_printf(
2961 ngettext("%s, %d minute", "%s, %d minutes", mins),
2962 ret, mins);
2963 g_free(ret);
2964 ret = tmp;
2965 }
2966 else
2967 ret = g_strdup_printf(ngettext("%d minute", "%d minutes", mins), mins);
2968 }
2969
2970 return ret;
2971 }
2972
2973
2974 char *
2975 gaim_str_binary_to_ascii(const unsigned char *binary, guint len)
2976 {
2977 GString *ret;
2978 guint i;
2979
2980 g_return_val_if_fail(len > 0, NULL);
2981
2982 ret = g_string_sized_new(len);
2983
2984 for (i = 0; i < len; i++)
2985 if (binary[i] < 32 || binary[i] > 126)
2986 g_string_append_printf(ret, "\\x%02hhx", binary[i]);
2987 else if (binary[i] == '\\')
2988 g_string_append(ret, "\\\\");
2989 else
2990 g_string_append_c(ret, binary[i]);
2991
2992 return g_string_free(ret, FALSE);
2993 }
2994
2995 /**************************************************************************
2996 * URI/URL Functions
2997 **************************************************************************/
2998 gboolean
2999 gaim_url_parse(const char *url, char **ret_host, int *ret_port,
3000 char **ret_path, char **ret_user, char **ret_passwd)
3001 {
3002 char scan_info[255];
3003 char port_str[6];
3004 int f;
3005 const char *at, *slash;
3006 const char *turl;
3007 char host[256], path[256], user[256], passwd[256];
3008 int port = 0;
3009 /* hyphen at end includes it in control set */
3010 static char addr_ctrl[] = "A-Za-z0-9.-";
3011 static char port_ctrl[] = "0-9";
3012 static char page_ctrl[] = "A-Za-z0-9.~_/:*!@&%%?=+^-";
3013 static char user_ctrl[] = "A-Za-z0-9.~_/*!&%%?=+^-";
3014 static char passwd_ctrl[] = "A-Za-z0-9.~_/*!&%%?=+^-";
3015
3016 g_return_val_if_fail(url != NULL, FALSE);
3017
3018 if ((turl = strstr(url, "http://")) != NULL ||
3019 (turl = strstr(url, "HTTP://")) != NULL)
3020 {
3021 turl += 7;
3022 url = turl;
3023 }
3024
3025 /* parse out authentication information if supplied */
3026 /* Only care about @ char BEFORE the first / */
3027 at = strchr(url, '@');
3028 slash = strchr(url, '/');
3029 if ((at != NULL) &&
3030 (((slash != NULL) && (strlen(at) > strlen(slash))) ||
3031 (slash == NULL))) {
3032 g_snprintf(scan_info, sizeof(scan_info),
3033 "%%255[%s]:%%255[%s]^@", user_ctrl, passwd_ctrl);
3034 f = sscanf(url, scan_info, user, passwd);
3035
3036 if (f ==1 ) {
3037 /* No passwd, possibly just username supplied */
3038 g_snprintf(scan_info, sizeof(scan_info),
3039 "%%255[%s]^@", user_ctrl);
3040 f = sscanf(url, scan_info, user);
3041 *passwd = '\0';
3042 }
3043
3044 url = at+1; /* move pointer after the @ char */
3045 } else {
3046 *user = '\0';
3047 *passwd = '\0';
3048 }
3049
3050 g_snprintf(scan_info, sizeof(scan_info),
3051 "%%255[%s]:%%5[%s]/%%255[%s]", addr_ctrl, port_ctrl, page_ctrl);
3052
3053 f = sscanf(url, scan_info, host, port_str, path);
3054
3055 if (f == 1)
3056 {
3057 g_snprintf(scan_info, sizeof(scan_info),
3058 "%%255[%s]/%%255[%s]",
3059 addr_ctrl, page_ctrl);
3060 f = sscanf(url, scan_info, host, path);
3061 g_snprintf(port_str, sizeof(port_str), "80");
3062 }
3063
3064 if (f == 1)
3065 *path = '\0';
3066
3067 sscanf(port_str, "%d", &port);
3068
3069 if (ret_host != NULL) *ret_host = g_strdup(host);
3070 if (ret_port != NULL) *ret_port = port;
3071 if (ret_path != NULL) *ret_path = g_strdup(path);
3072 if (ret_user != NULL) *ret_user = g_strdup(user);
3073 if (ret_passwd != NULL) *ret_passwd = g_strdup(passwd);
3074
3075 return TRUE;
3076 }
3077
3078 /**
3079 * The arguments to this function are similar to printf.
3080 */
3081 static void
3082 gaim_util_fetch_url_error(GaimUtilFetchUrlData *gfud, const char *format, ...)
3083 {
3084 gchar *error_message;
3085 va_list args;
3086
3087 va_start(args, format);
3088 error_message = g_strdup_vprintf(format, args);
3089 va_end(args);
3090
3091 gfud->callback(gfud, gfud->user_data, NULL, 0, error_message);
3092 g_free(error_message);
3093 gaim_util_fetch_url_cancel(gfud);
3094 }
3095
3096 static void url_fetch_connect_cb(gpointer url_data, gint source, const gchar *error_message);
3097
3098 static gboolean
3099 parse_redirect(const char *data, size_t data_len, gint sock,
3100 GaimUtilFetchUrlData *gfud)
3101 {
3102 gchar *s;
3103
3104 if ((s = g_strstr_len(data, data_len, "Location: ")) != NULL)
3105 {
3106 gchar *new_url, *temp_url, *end;
3107 gboolean full;
3108 int len;
3109
3110 s += strlen("Location: ");
3111 end = strchr(s, '\r');
3112
3113 /* Just in case :) */
3114 if (end == NULL)
3115 end = strchr(s, '\n');
3116
3117 if (end == NULL)
3118 return FALSE;
3119
3120 len = end - s;
3121
3122 new_url = g_malloc(len + 1);
3123 strncpy(new_url, s, len);
3124 new_url[len] = '\0';
3125
3126 full = gfud->full;
3127
3128 if (*new_url == '/' || g_strstr_len(new_url, len, "://") == NULL)
3129 {
3130 temp_url = new_url;
3131
3132 new_url = g_strdup_printf("%s:%d%s", gfud->website.address,
3133 gfud->website.port, temp_url);
3134
3135 g_free(temp_url);
3136
3137 full = FALSE;
3138 }
3139
3140 gaim_debug_info("util", "Redirecting to %s\n", new_url);
3141
3142 /*
3143 * Try again, with this new location. This code is somewhat
3144 * ugly, but we need to reuse the gfud because whoever called
3145 * us is holding a reference to it.
3146 */
3147 g_free(gfud->url);
3148 gfud->url = new_url;
3149 gfud->full = full;
3150 g_free(gfud->request);
3151 gfud->request = NULL;
3152
3153 g_free(gfud->website.user);
3154 g_free(gfud->website.passwd);
3155 g_free(gfud->website.address);
3156 g_free(gfud->website.page);
3157 gaim_url_parse(new_url, &gfud->website.address, &gfud->website.port,
3158 &gfud->website.page, &gfud->website.user, &gfud->website.passwd);
3159
3160 gfud->connect_data = gaim_proxy_connect(NULL, NULL,
3161 gfud->website.address, gfud->website.port,
3162 url_fetch_connect_cb, gfud);
3163
3164 if (gfud->connect_data == NULL)
3165 {
3166 gaim_util_fetch_url_error(gfud, _("Unable to connect to %s"),
3167 gfud->website.address);
3168 }
3169
3170 return TRUE;
3171 }
3172
3173 return FALSE;
3174 }
3175
3176 static size_t
3177 parse_content_len(const char *data, size_t data_len)
3178 {
3179 size_t content_len = 0;
3180 const char *p = NULL;
3181
3182 /* This is still technically wrong, since headers are case-insensitive
3183 * [RFC 2616, section 4.2], though this ought to catch the normal case.
3184 * Note: data is _not_ nul-terminated.
3185 */
3186 if(data_len > 16) {
3187 p = (strncmp(data, "Content-Length: ", 16) == 0) ? data : NULL;
3188 if(!p)
3189 p = (strncmp(data, "CONTENT-LENGTH: ", 16) == 0)
3190 ? data : NULL;
3191 if(!p) {
3192 p = g_strstr_len(data, data_len, "\nContent-Length: ");
3193 if (p)
3194 p++;
3195 }
3196 if(!p) {
3197 p = g_strstr_len(data, data_len, "\nCONTENT-LENGTH: ");
3198 if (p)
3199 p++;
3200 }
3201
3202 if(p)
3203 p += 16;
3204 }
3205
3206 /* If we can find a Content-Length header at all, try to sscanf it.
3207 * Response headers should end with at least \r\n, so sscanf is safe,
3208 * if we make sure that there is indeed a \n in our header.
3209 */
3210 if (p && g_strstr_len(p, data_len - (p - data), "\n")) {
3211 sscanf(p, "%" G_GSIZE_FORMAT, &content_len);
3212 gaim_debug_misc("util", "parsed %u\n", content_len);
3213 }
3214
3215 return content_len;
3216 }
3217
3218
3219 static void
3220 url_fetch_recv_cb(gpointer url_data, gint source, GaimInputCondition cond)
3221 {
3222 GaimUtilFetchUrlData *gfud = url_data;
3223 int len;
3224 char buf[4096];
3225 char *data_cursor;
3226 gboolean got_eof = FALSE;
3227
3228 while((len = read(source, buf, sizeof(buf))) > 0) {
3229 /* If we've filled up our buffer, make it bigger */
3230 if((gfud->len + len) >= gfud->data_len) {
3231 while((gfud->len + len) >= gfud->data_len)
3232 gfud->data_len += sizeof(buf);
3233
3234 gfud->webdata = g_realloc(gfud->webdata, gfud->data_len);
3235 }
3236
3237 data_cursor = gfud->webdata + gfud->len;
3238
3239 gfud->len += len;
3240
3241 memcpy(data_cursor, buf, len);
3242
3243 gfud->webdata[gfud->len] = '\0';
3244
3245 if(!gfud->got_headers) {
3246 char *tmp;
3247
3248 /* See if we've reached the end of the headers yet */
3249 if((tmp = strstr(gfud->webdata, "\r\n\r\n"))) {
3250 char * new_data;
3251 guint header_len = (tmp + 4 - gfud->webdata);
3252 size_t content_len;
3253
3254 gaim_debug_misc("util", "Response headers: '%.*s'\n",
3255 header_len, gfud->webdata);
3256
3257 /* See if we can find a redirect. */
3258 if(parse_redirect(gfud->webdata, header_len, source, gfud))
3259 return;
3260
3261 gfud->got_headers = TRUE;
3262
3263 /* No redirect. See if we can find a content length. */
3264 content_len = parse_content_len(gfud->webdata, header_len);
3265
3266 if(content_len == 0) {
3267 /* We'll stick with an initial 8192 */
3268 content_len = 8192;
3269 } else {
3270 gfud->has_explicit_data_len = TRUE;
3271 }
3272
3273
3274 /* If we're returning the headers too, we don't need to clean them out */
3275 if(gfud->include_headers) {
3276 gfud->data_len = content_len + header_len;
3277 gfud->webdata = g_realloc(gfud->webdata, gfud->data_len);
3278 } else {
3279 size_t body_len = 0;
3280
3281 if(gfud->len > (header_len + 1))
3282 body_len = (gfud->len - header_len);
3283
3284 content_len = MAX(content_len, body_len);
3285
3286 new_data = g_try_malloc(content_len);
3287 if(new_data == NULL) {
3288 gaim_debug_error("util",
3289 "Failed to allocate %u bytes: %s\n",
3290 content_len, strerror(errno));
3291 gaim_util_fetch_url_error(gfud,
3292 _("Unable to allocate enough memory to hold "
3293 "the contents from %s. The web server may "
3294 "be trying something malicious."),
3295 gfud->website.address);
3296
3297 return;
3298 }
3299
3300 /* We may have read part of the body when reading the headers, don't lose it */
3301 if(body_len > 0) {
3302 tmp += 4;
3303 memcpy(new_data, tmp, body_len);
3304 }
3305
3306 /* Out with the old... */
3307 g_free(gfud->webdata);
3308
3309 /* In with the new. */
3310 gfud->len = body_len;
3311 gfud->data_len = content_len;
3312 gfud->webdata = new_data;
3313 }
3314 }
3315 }
3316
3317 if(gfud->has_explicit_data_len && gfud->len >= gfud->data_len) {
3318 got_eof = TRUE;
3319 break;
3320 }
3321 }
3322
3323 if(len < 0) {
3324 if(errno == EAGAIN) {
3325 return;
3326 } else {
3327 gaim_util_fetch_url_error(gfud, _("Error reading from %s: %s"),
3328 gfud->website.address, strerror(errno));
3329 return;
3330 }
3331 }
3332
3333 if((len == 0) || got_eof) {
3334 gfud->webdata = g_realloc(gfud->webdata, gfud->len + 1);
3335 gfud->webdata[gfud->len] = '\0';
3336
3337 gfud->callback(gfud, gfud->user_data, gfud->webdata, gfud->len, NULL);
3338 gaim_util_fetch_url_cancel(gfud);
3339 }
3340 }
3341
3342 static void
3343 url_fetch_send_cb(gpointer data, gint source, GaimInputCondition cond)
3344 {
3345 GaimUtilFetchUrlData *gfud;
3346 int len, total_len;
3347
3348 gfud = data;
3349
3350 total_len = strlen(gfud->request);
3351
3352 len = write(gfud->fd, gfud->request + gfud->request_written,
3353 total_len - gfud->request_written);
3354
3355 if (len < 0 && errno == EAGAIN)
3356 return;
3357 else if (len < 0) {
3358 gaim_util_fetch_url_error(gfud, _("Error writing to %s: %s"),
3359 gfud->website.address, strerror(errno));
3360 return;
3361 }
3362 gfud->request_written += len;
3363
3364 if (gfud->request_written != total_len)
3365 return;
3366
3367 /* We're done writing our request, now start reading the response */
3368 gaim_input_remove(gfud->inpa);
3369 gfud->inpa = gaim_input_add(gfud->fd, GAIM_INPUT_READ, url_fetch_recv_cb,
3370 gfud);
3371 }
3372
3373 static void
3374 url_fetch_connect_cb(gpointer url_data, gint source, const gchar *error_message)
3375 {
3376 GaimUtilFetchUrlData *gfud;
3377
3378 gfud = url_data;
3379 gfud->connect_data = NULL;
3380
3381 if (source == -1)
3382 {
3383 gaim_util_fetch_url_error(gfud, _("Unable to connect to %s: %s"),
3384 (gfud->website.address ? gfud->website.address : ""), error_message);
3385 return;
3386 }
3387
3388 gfud->fd = source;
3389
3390 if (!gfud->request)
3391 {
3392 if (gfud->user_agent) {
3393 /* Host header is not forbidden in HTTP/1.0 requests, and HTTP/1.1
3394 * clients must know how to handle the "chunked" transfer encoding.
3395 * Gaim doesn't know how to handle "chunked", so should always send
3396 * the Host header regardless, to get around some observed problems
3397 */
3398 gfud->request = g_strdup_printf(
3399 "GET %s%s HTTP/%s\r\n"
3400 "Connection: close\r\n"
3401 "User-Agent: %s\r\n"
3402 "Accept: */*\r\n"
3403 "Host: %s\r\n\r\n",
3404 (gfud->full ? "" : "/"),
3405 (gfud->full ? (gfud->url ? gfud->url : "") : (gfud->website.page ? gfud->website.page : "")),
3406 (gfud->http11 ? "1.1" : "1.0"),
3407 (gfud->user_agent ? gfud->user_agent : ""),
3408 (gfud->website.address ? gfud->website.address : ""));
3409 } else {
3410 gfud->request = g_strdup_printf(
3411 "GET %s%s HTTP/%s\r\n"
3412 "Connection: close\r\n"
3413 "Accept: */*\r\n"
3414 "Host: %s\r\n\r\n",
3415 (gfud->full ? "" : "/"),
3416 (gfud->full ? (gfud->url ? gfud->url : "") : (gfud->website.page ? gfud->website.page : "")),
3417 (gfud->http11 ? "1.1" : "1.0"),
3418 (gfud->website.address ? gfud->website.address : ""));
3419 }
3420 }
3421
3422 gaim_debug_misc("util", "Request: '%s'\n", gfud->request);
3423
3424 gfud->inpa = gaim_input_add(source, GAIM_INPUT_WRITE,
3425 url_fetch_send_cb, gfud);
3426 url_fetch_send_cb(gfud, source, GAIM_INPUT_WRITE);
3427 }
3428
3429 GaimUtilFetchUrlData *
3430 gaim_util_fetch_url_request(const char *url, gboolean full,
3431 const char *user_agent, gboolean http11,
3432 const char *request, gboolean include_headers,
3433 GaimUtilFetchUrlCallback callback, void *user_data)
3434 {
3435 GaimUtilFetchUrlData *gfud;
3436
3437 g_return_val_if_fail(url != NULL, NULL);
3438 g_return_val_if_fail(callback != NULL, NULL);
3439
3440 gaim_debug_info("util",
3441 "requested to fetch (%s), full=%d, user_agent=(%s), http11=%d\n",
3442 url, full, user_agent?user_agent:"(null)", http11);
3443
3444 gfud = g_new0(GaimUtilFetchUrlData, 1);
3445
3446 gfud->callback = callback;
3447 gfud->user_data = user_data;
3448 gfud->url = g_strdup(url);
3449 gfud->user_agent = g_strdup(user_agent);
3450 gfud->http11 = http11;
3451 gfud->full = full;
3452 gfud->request = g_strdup(request);
3453 gfud->include_headers = include_headers;
3454
3455 gaim_url_parse(url, &gfud->website.address, &gfud->website.port,
3456 &gfud->website.page, &gfud->website.user, &gfud->website.passwd);
3457
3458 gfud->connect_data = gaim_proxy_connect(NULL, NULL,
3459 gfud->website.address, gfud->website.port,
3460 url_fetch_connect_cb, gfud);
3461
3462 if (gfud->connect_data == NULL)
3463 {
3464 gaim_util_fetch_url_error(gfud, _("Unable to connect to %s"),
3465 gfud->website.address);
3466 return NULL;
3467 }
3468
3469 return gfud;
3470 }
3471
3472 void
3473 gaim_util_fetch_url_cancel(GaimUtilFetchUrlData *gfud)
3474 {
3475 if (gfud->connect_data != NULL)
3476 gaim_proxy_connect_cancel(gfud->connect_data);
3477
3478 if (gfud->inpa > 0)
3479 gaim_input_remove(gfud->inpa);
3480
3481 if (gfud->fd >= 0)
3482 close(gfud->fd);
3483
3484 g_free(gfud->website.user);
3485 g_free(gfud->website.passwd);
3486 g_free(gfud->website.address);
3487 g_free(gfud->website.page);
3488 g_free(gfud->url);
3489 g_free(gfud->user_agent);
3490 g_free(gfud->request);
3491 g_free(gfud->webdata);
3492
3493 g_free(gfud);
3494 }
3495
3496 const char *
3497 gaim_url_decode(const char *str)
3498 {
3499 static char buf[BUF_LEN];
3500 guint i, j = 0;
3501 char *bum;
3502 char hex[3];
3503
3504 g_return_val_if_fail(str != NULL, NULL);
3505
3506 /*
3507 * XXX - This check could be removed and buf could be made
3508 * dynamically allocated, but this is easier.
3509 */
3510 if (strlen(str) >= BUF_LEN)
3511 return NULL;
3512
3513 for (i = 0; i < strlen(str); i++) {
3514
3515 if (str[i] != '%')
3516 buf[j++] = str[i];
3517 else {
3518 strncpy(hex, str + ++i, 2);
3519 hex[2] = '\0';
3520
3521 /* i is pointing to the start of the number */
3522 i++;
3523
3524 /*
3525 * Now it's at the end and at the start of the for loop
3526 * will be at the next character.
3527 */
3528 buf[j++] = strtol(hex, NULL, 16);
3529 }
3530 }
3531
3532 buf[j] = '\0';
3533
3534 if (!g_utf8_validate(buf, -1, (const char **)&bum))
3535 *bum = '\0';
3536
3537 return buf;
3538 }
3539
3540 const char *
3541 gaim_url_encode(const char *str)
3542 {
3543 const char *iter;
3544 static char buf[BUF_LEN];
3545 char utf_char[6];
3546 guint i, j = 0;
3547
3548 g_return_val_if_fail(str != NULL, NULL);
3549 g_return_val_if_fail(g_utf8_validate(str, -1, NULL), NULL);
3550
3551 iter = str;
3552 for (; *iter && j < (BUF_LEN - 1) ; iter = g_utf8_next_char(iter)) {
3553 gunichar c = g_utf8_get_char(iter);
3554 /* If the character is an ASCII character and is alphanumeric
3555 * no need to escape */
3556 if (c < 128 && isalnum(c)) {
3557 buf[j++] = c;
3558 } else {
3559 int bytes = g_unichar_to_utf8(c, utf_char);
3560 for (i = 0; i < bytes; i++) {
3561 if (j > (BUF_LEN - 4))
3562 break;
3563 sprintf(buf + j, "%%%02x", utf_char[i] & 0xff);
3564 j += 3;
3565 }
3566 }
3567 }
3568
3569 buf[j] = '\0';
3570
3571 return buf;
3572 }
3573
3574 /* Originally lifted from
3575 * http://www.oreillynet.com/pub/a/network/excerpt/spcookbook_chap03/index3.html
3576 * ... and slightly modified to be a bit more rfc822 compliant
3577 * ... and modified a bit more to make domain checking rfc1035 compliant
3578 * with the exception permitted in rfc1101 for domains to start with digit
3579 * but not completely checking to avoid conflicts with IP addresses
3580 */
3581 gboolean
3582 gaim_email_is_valid(const char *address)
3583 {
3584 const char *c, *domain;
3585 static char *rfc822_specials = "()<>@,;:\\\"[]";
3586
3587 /* first we validate the name portion (name@domain) (rfc822)*/
3588 for (c = address; *c; c++) {
3589 if (*c == '\"' && (c == address || *(c - 1) == '.' || *(c - 1) == '\"')) {
3590 while (*++c) {
3591 if (*c == '\\') {
3592 if (*c++ && *c < 127 && *c != '\n' && *c != '\r') continue;
3593 else return FALSE;
3594 }
3595 if (*c == '\"') break;
3596 if (*c < ' ' || *c >= 127) return FALSE;
3597 }
3598 if (!*c++) return FALSE;
3599 if (*c == '@') break;
3600 if (*c != '.') return FALSE;
3601 continue;
3602 }
3603 if (*c == '@') break;
3604 if (*c <= ' ' || *c >= 127) return FALSE;
3605 if (strchr(rfc822_specials, *c)) return FALSE;
3606 }
3607 /* strictly we should return false if (*(c - 1) == '.') too, but I think
3608 * we should permit user.@domain type addresses - they do work :) */
3609 if (c == address) return FALSE;
3610
3611 /* next we validate the domain portion (name@domain) (rfc1035 & rfc1011) */
3612 if (!*(domain = ++c)) return FALSE;
3613 do {
3614 if (*c == '.' && (c == domain || *(c - 1) == '.' || *(c - 1) == '-'))
3615 return FALSE;
3616 if (*c == '-' && *(c - 1) == '.') return FALSE;
3617 if ((*c < '0' && *c != '-' && *c != '.') || (*c > '9' && *c < 'A') ||
3618 (*c > 'Z' && *c < 'a') || (*c > 'z')) return FALSE;
3619 } while (*++c);
3620
3621 if (*(c - 1) == '-') return FALSE;
3622
3623 return ((c - domain) > 3 ? TRUE : FALSE);
3624 }
3625
3626 /* Stolen from gnome_uri_list_extract_uris */
3627 GList *
3628 gaim_uri_list_extract_uris(const gchar *uri_list)
3629 {
3630 const gchar *p, *q;
3631 gchar *retval;
3632 GList *result = NULL;
3633
3634 g_return_val_if_fail (uri_list != NULL, NULL);
3635
3636 p = uri_list;
3637
3638 /* We don't actually try to validate the URI according to RFC
3639 * 2396, or even check for allowed characters - we just ignore
3640 * comments and trim whitespace off the ends. We also
3641 * allow LF delimination as well as the specified CRLF.
3642 */
3643 while (p) {
3644 if (*p != '#') {
3645 while (isspace(*p))
3646 p++;
3647
3648 q = p;
3649 while (*q && (*q != '\n') && (*q != '\r'))
3650 q++;
3651
3652 if (q > p) {
3653 q--;
3654 while (q > p && isspace(*q))
3655 q--;
3656
3657 retval = (gchar*)g_malloc (q - p + 2);
3658 strncpy (retval, p, q - p + 1);
3659 retval[q - p + 1] = '\0';
3660
3661 result = g_list_prepend (result, retval);
3662 }
3663 }
3664 p = strchr (p, '\n');
3665 if (p)
3666 p++;
3667 }
3668
3669 return g_list_reverse (result);
3670 }
3671
3672
3673 /* Stolen from gnome_uri_list_extract_filenames */
3674 GList *
3675 gaim_uri_list_extract_filenames(const gchar *uri_list)
3676 {
3677 GList *tmp_list, *node, *result;
3678
3679 g_return_val_if_fail (uri_list != NULL, NULL);
3680
3681 result = gaim_uri_list_extract_uris(uri_list);
3682
3683 tmp_list = result;
3684 while (tmp_list) {
3685 gchar *s = (gchar*)tmp_list->data;
3686
3687 node = tmp_list;
3688 tmp_list = tmp_list->next;
3689
3690 if (!strncmp (s, "file:", 5)) {
3691 node->data = g_filename_from_uri (s, NULL, NULL);
3692 /* not sure if this fallback is useful at all */
3693 if (!node->data) node->data = g_strdup (s+5);
3694 } else {
3695 result = g_list_remove_link(result, node);
3696 g_list_free_1 (node);
3697 }
3698 g_free (s);
3699 }
3700 return result;
3701 }
3702
3703 /**************************************************************************
3704 * UTF8 String Functions
3705 **************************************************************************/
3706 gchar *
3707 gaim_utf8_try_convert(const char *str)
3708 {
3709 gsize converted;
3710 gchar *utf8;
3711
3712 g_return_val_if_fail(str != NULL, NULL);
3713
3714 if (g_utf8_validate(str, -1, NULL)) {
3715 return g_strdup(str);
3716 }
3717
3718 utf8 = g_locale_to_utf8(str, -1, &converted, NULL, NULL);
3719 if (utf8 != NULL)
3720 return utf8;
3721
3722 utf8 = g_convert(str, -1, "UTF-8", "ISO-8859-15", &converted, NULL, NULL);
3723 if ((utf8 != NULL) && (converted == strlen(str)))
3724 return utf8;
3725
3726 g_free(utf8);
3727
3728 return NULL;
3729 }
3730
3731 #define utf8_first(x) ((x & 0x80) == 0 || (x & 0xe0) == 0xc0 \
3732 || (x & 0xf0) == 0xe0 || (x & 0xf8) == 0xf)
3733 gchar *
3734 gaim_utf8_salvage(const char *str)
3735 {
3736 GString *workstr;
3737 const char *end;
3738
3739 g_return_val_if_fail(str != NULL, NULL);
3740
3741 workstr = g_string_sized_new(strlen(str));
3742
3743 do {
3744 g_utf8_validate(str, -1, &end);
3745 workstr = g_string_append_len(workstr, str, end - str);
3746 str = end;
3747 if (*str == '\0')
3748 break;
3749 do {
3750 workstr = g_string_append_c(workstr, '?');
3751 str++;
3752 } while (!utf8_first(*str));
3753 } while (*str != '\0');
3754
3755 return g_string_free(workstr, FALSE);
3756 }
3757
3758
3759 char *
3760 gaim_utf8_ncr_encode(const char *str)
3761 {
3762 GString *out;
3763
3764 g_return_val_if_fail(str != NULL, NULL);
3765 g_return_val_if_fail(g_utf8_validate(str, -1, NULL), NULL);
3766
3767 out = g_string_new("");
3768
3769 for(; *str; str = g_utf8_next_char(str)) {
3770 gunichar wc = g_utf8_get_char(str);
3771
3772 /* super simple check. hopefully not too wrong. */
3773 if(wc >= 0x80) {
3774 g_string_append_printf(out, "&#%u;", (guint32) wc);
3775 } else {
3776 g_string_append_unichar(out, wc);
3777 }
3778 }
3779
3780 return g_string_free(out, FALSE);
3781 }
3782
3783
3784 char *
3785 gaim_utf8_ncr_decode(const char *str)
3786 {
3787 GString *out;
3788 char *buf, *b;
3789
3790 g_return_val_if_fail(str != NULL, NULL);
3791 g_return_val_if_fail(g_utf8_validate(str, -1, NULL), NULL);
3792
3793 buf = (char *) str;
3794 out = g_string_new("");
3795
3796 while( (b = strstr(buf, "&#")) ) {
3797 gunichar wc;
3798 int base = 0;
3799
3800 /* append everything leading up to the &# */
3801 g_string_append_len(out, buf, b-buf);
3802
3803 b += 2; /* skip past the &# */
3804
3805 /* strtoul will treat 0x prefix as hex, but not just x */
3806 if(*b == 'x' || *b == 'X') {
3807 base = 16;
3808 b++;
3809 }
3810
3811 /* advances buf to the end of the ncr segment */
3812 wc = (gunichar) strtoul(b, &buf, base);
3813
3814 /* this mimics the previous impl of ncr_decode */
3815 if(*buf == ';') {
3816 g_string_append_unichar(out, wc);
3817 buf++;
3818 }
3819 }
3820
3821 /* append whatever's left */
3822 g_string_append(out, buf);
3823
3824 return g_string_free(out, FALSE);
3825 }
3826
3827
3828 int
3829 gaim_utf8_strcasecmp(const char *a, const char *b)
3830 {
3831 char *a_norm = NULL;
3832 char *b_norm = NULL;
3833 int ret = -1;
3834
3835 if(!a && b)
3836 return -1;
3837 else if(!b && a)
3838 return 1;
3839 else if(!a && !b)
3840 return 0;
3841
3842 if(!g_utf8_validate(a, -1, NULL) || !g_utf8_validate(b, -1, NULL))
3843 {
3844 gaim_debug_error("gaim_utf8_strcasecmp",
3845 "One or both parameters are invalid UTF8\n");
3846 return ret;
3847 }
3848
3849 a_norm = g_utf8_casefold(a, -1);
3850 b_norm = g_utf8_casefold(b, -1);
3851 ret = g_utf8_collate(a_norm, b_norm);
3852 g_free(a_norm);
3853 g_free(b_norm);
3854
3855 return ret;
3856 }
3857
3858 /* previously conversation::find_nick() */
3859 gboolean
3860 gaim_utf8_has_word(const char *haystack, const char *needle)
3861 {
3862 char *hay, *pin, *p;
3863 int n;
3864 gboolean ret = FALSE;
3865
3866 hay = g_utf8_strdown(haystack, -1);
3867
3868 pin = g_utf8_strdown(needle, -1);
3869 n = strlen(pin);
3870
3871 if ((p = strstr(hay, pin)) != NULL) {
3872 if ((p == hay || !isalnum(*(p - 1))) && !isalnum(*(p + n))) {
3873 ret = TRUE;
3874 }
3875 }
3876
3877 g_free(pin);
3878 g_free(hay);
3879
3880 return ret;
3881 }
3882
3883 void
3884 gaim_print_utf8_to_console(FILE *filestream, char *message)
3885 {
3886 gchar *message_conv;
3887 GError *error = NULL;
3888
3889 /* Try to convert 'message' to user's locale */
3890 message_conv = g_locale_from_utf8(message, -1, NULL, NULL, &error);
3891 if (message_conv != NULL) {
3892 fputs(message_conv, filestream);
3893 g_free(message_conv);
3894 }
3895 else
3896 {
3897 /* use 'message' as a fallback */
3898 g_warning("%s\n", error->message);
3899 g_error_free(error);
3900 fputs(message, filestream);
3901 }
3902 }
3903
3904 gboolean gaim_message_meify(char *message, size_t len)
3905 {
3906 char *c;
3907 gboolean inside_html = FALSE;
3908
3909 g_return_val_if_fail(message != NULL, FALSE);
3910
3911 if(len == -1)
3912 len = strlen(message);
3913
3914 for (c = message; *c; c++, len--) {
3915 if(inside_html) {
3916 if(*c == '>')
3917 inside_html = FALSE;
3918 } else {
3919 if(*c == '<')
3920 inside_html = TRUE;
3921 else
3922 break;
3923 }
3924 }
3925
3926 if(*c && !g_ascii_strncasecmp(c, "/me ", 4)) {
3927 memmove(c, c+4, len-3);
3928 return TRUE;
3929 }
3930
3931 return FALSE;
3932 }
3933
3934 char *gaim_text_strip_mnemonic(const char *in)
3935 {
3936 char *out;
3937 char *a;
3938 char *a0;
3939 const char *b;
3940
3941 g_return_val_if_fail(in != NULL, NULL);
3942
3943 out = g_malloc(strlen(in)+1);
3944 a = out;
3945 b = in;
3946
3947 a0 = a; /* The last non-space char seen so far, or the first char */
3948
3949 while(*b) {
3950 if(*b == '_') {
3951 if(a > out && b > in && *(b-1) == '(' && *(b+1) && !(*(b+1) & 0x80) && *(b+2) == ')') {
3952 /* Detected CJK style shortcut (Bug 875311) */
3953 a = a0; /* undo the left parenthesis */
3954 b += 3; /* and skip the whole mess */
3955 } else if(*(b+1) == '_') {
3956 *(a++) = '_';
3957 b += 2;
3958 a0 = a;
3959 } else {
3960 b++;
3961 }
3962 /* We don't want to corrupt the middle of UTF-8 characters */
3963 } else if (!(*b & 0x80)) { /* other 1-byte char */
3964 if (*b != ' ')
3965 a0 = a;
3966 *(a++) = *(b++);
3967 } else {
3968 /* Multibyte utf8 char, don't look for _ inside these */
3969 int n = 0;
3970 int i;
3971 if ((*b & 0xe0) == 0xc0) {
3972 n = 2;
3973 } else if ((*b & 0xf0) == 0xe0) {
3974 n = 3;
3975 } else if ((*b & 0xf8) == 0xf0) {
3976 n = 4;
3977 } else if ((*b & 0xfc) == 0xf8) {
3978 n = 5;
3979 } else if ((*b & 0xfe) == 0xfc) {
3980 n = 6;
3981 } else { /* Illegal utf8 */
3982 n = 1;
3983 }
3984 a0 = a; /* unless we want to delete CJK spaces too */
3985 for (i = 0; i < n && *b; i += 1) {
3986 *(a++) = *(b++);
3987 }
3988 }
3989 }
3990 *a = '\0';
3991
3992 return out;
3993 }
3994
3995 const char* gaim_unescape_filename(const char *escaped) {
3996 return gaim_url_decode(escaped);
3997 }
3998
3999
4000 /* this is almost identical to gaim_url_encode (hence gaim_url_decode
4001 * being used above), but we want to keep certain characters unescaped
4002 * for compat reasons */
4003 const char *
4004 gaim_escape_filename(const char *str)
4005 {
4006 const char *iter;
4007 static char buf[BUF_LEN];
4008 char utf_char[6];
4009 guint i, j = 0;
4010
4011 g_return_val_if_fail(str != NULL, NULL);
4012 g_return_val_if_fail(g_utf8_validate(str, -1, NULL), NULL);
4013
4014 iter = str;
4015 for (; *iter && j < (BUF_LEN - 1) ; iter = g_utf8_next_char(iter)) {
4016 gunichar c = g_utf8_get_char(iter);
4017 /* If the character is an ASCII character and is alphanumeric,
4018 * or one of the specified values, no need to escape */
4019 if (c < 128 && (isalnum(c) || c == '@' || c == '-' ||
4020 c == '_' || c == '.' || c == '#')) {
4021 buf[j++] = c;
4022 } else {
4023 int bytes = g_unichar_to_utf8(c, utf_char);
4024 for (i = 0; i < bytes; i++) {
4025 if (j > (BUF_LEN - 4))
4026 break;
4027 sprintf(buf + j, "%%%02x", utf_char[i] & 0xff);
4028 j += 3;
4029 }
4030 }
4031 }
4032
4033 buf[j] = '\0';
4034
4035 return buf;
4036 }
4037