pidgin: src/util.c comparison

comparison src/util.c @ 12880:bad785371fa5

[gaim-migrate @ 15232] Reworks gaim_utf8_ncr_decode to handle hex and octal as well as decimal formats. I tested this a bit with Sametime, and it seems to be working fine. Hopefully none of our target platforms is unusual enough to be missing strtoul. committer: Tailor Script <tailor@pidgin.im>

author	Christopher O'Brien <siege@pidgin.im>
date	Sun, 15 Jan 2006 05:50:28 +0000
parents	547c199072c8
children	4229503f1cd9

comparison

equal deleted inserted replaced

-:f8748df5c17a
+:bad785371fa5
 	return g_string_free(workstr, FALSE);
 }
 char *
-gaim_utf8_ncr_encode(const char *in)
+gaim_utf8_ncr_encode(const char *str)
 {
 	GString *out;
-	g_return_val_if_fail(in != NULL, NULL);
+	g_return_val_if_fail(str != NULL, NULL);
-	g_return_val_if_fail(g_utf8_validate(in, -1, NULL), NULL);
+	g_return_val_if_fail(g_utf8_validate(str, -1, NULL), NULL);
 	out = g_string_new("");
-	for(; *in; in = g_utf8_next_char(in)) {
+	for(; *str; str = g_utf8_next_char(str)) {
-		gunichar wc = g_utf8_get_char(in);
+		gunichar wc = g_utf8_get_char(str);
-		if(wc >= 0x80) { /* super simple check. hopefully not too wrong. */
+		/* super simple check. hopefully not too wrong. */
+		if(wc >= 0x80) {
 			g_string_append_printf(out, "&#%u;", (guint32) wc);
 		} else {
 			g_string_append_unichar(out, wc);
 		}
 	}
 	return g_string_free(out, FALSE);
 }
 char *
-gaim_utf8_ncr_decode(const char *in)
+gaim_utf8_ncr_decode(const char *str)
 {
 	GString *out;
-	int i;
+	char *buf, *b;
-	g_return_val_if_fail(in != NULL, NULL);
+	g_return_val_if_fail(str != NULL, NULL);
-	g_return_val_if_fail(g_utf8_validate(in, -1, NULL), NULL);
+	g_return_val_if_fail(g_utf8_validate(str, -1, NULL), NULL);
+	buf = (char *) str;
 	out = g_string_new("");
-	/** @todo doesn't this break with hex formats? */
+	while( (b = strstr(buf, "&#")) ) {
-	for (i = 0; in[i]; i += 1) {
+		gunichar wc;
-		gboolean ncr_found_p = FALSE;
+		int base = 0;
-		if (in[i] == '&' && in[i + 1] == '#' && isdigit(in[i + 2])) {
-			gunichar wc;
+		/* append everything leading up to the &# */
-			int j;
+		g_string_append_len(out, buf, b-buf);
-			for (wc = 0, j = i + 2; isdigit(in[j]); j += 1) {
-				wc *= 10;
+		b += 2; /* skip past the &# */
-				wc += in[j] - '0';
-			}
+		/* strtoul will handle 0x prefix as hex, but not x */
-			if (in[j] == ';') { /* Technically not completely correct */
+		if(*b == 'x' || *b == 'X')
-				g_string_append_unichar(out, wc);
+			base = 16;
-				i = j;
-				ncr_found_p = TRUE;
+		/* advances buf to the end of the ncr segment */
-			}
+		wc = (gunichar) strtoul(b, &buf, base);
-		}
-		if (!ncr_found_p) {
+		/* this mimics the previous impl of ncr_decode */
-			g_string_append_c(out, in[i]);
+		if(*buf == ';') {
-		}
+			g_string_append_unichar(out, wc);
-	}
+			buf++;
+		}
+	}
+	/* append whatever's left */
+	g_string_append(out, buf);
 	return g_string_free(out, FALSE);
 }
 int
 gaim_utf8_strcasecmp(const char *a, const char *b)
 {
 	char *a_norm = NULL;

Mercurial > pidgin

comparison src/util.c @ 12880:bad785371fa5