emacs: src/coding.c comparison

comparison src/coding.c @ 72395:94e4795b333d

(ONE_MORE_BYTE_CHECK_MULTIBYTE): New arg RET. If SRC is exhausted, return with RET. (detect_coding_emacs_mule, detect_coding_iso2022) (detect_coding_sjis, detect_coding_big5, detect_coding_utf_8) (detect_coding_utf_16, detect_coding_ccl): Adjusted for the above change.

author	Kenichi Handa <handa@m17n.org>
date	Tue, 15 Aug 2006 02:41:29 +0000
parents	af796bc81ff0
children	6493d4697ad2 694bbb62a75d

comparison

equal deleted inserted replaced

-:bec9a701aee6
+:94e4795b333d
 c2 = *src++;						\
 } while (0)
 /* Like ONE_MORE_BYTE, but 8-bit bytes of data at SRC are in multibyte
-form if MULTIBYTEP is nonzero.  */
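+form if MULTIBYTEP is nonzero.  In addition, if SRC is not less
+than SRC_END (i.e. no source byte is left to read), set
+coding->result to CODING_FINISH_INSUFFICIENT_SRC and make the
+enclosing function return RET.  */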
-#define ONE_MORE_BYTE_CHECK_MULTIBYTE(c1, multibytep)		\
+#define ONE_MORE_BYTE_CHECK_MULTIBYTE(c1, multibytep, ret)	\
 do {								\
 if (src >= src_end)						\
 {								\
 	coding->result = CODING_FINISH_INSUFFICIENT_SRC;	\
-	goto label_end_of_loop;					\
+	return ret;						\
 }								\
 c1 = *src++;						\
 if (multibytep && c1 == LEADING_CODE_8_BIT_CONTROL)		\
 c1 = *src++ - 0x20;					\
 } while (0)
 struct coding_system dummy_coding;
 struct coding_system *coding = &dummy_coding;
 while (1)
 {
-ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep);
+ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep,
+				     CODING_CATEGORY_MASK_EMACS_MULE);
 if (composing)
 	{
 	  if (c < 0xA0)
 	    composing = 0;
 	  else if (c == 0xA0)
 	    {
-	      ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep);
+	      ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep, 0);
 	      c &= 0x7F;
 	    }
 	  else
 	    c -= 0x20;
 	}
 		return 0;
 	      src = src_base + bytes;
 	    }
 	}
 }
-label_end_of_loop:
-return CODING_CATEGORY_MASK_EMACS_MULE;
 }
 /* Record the starting position START and METHOD of one composition.  */
 struct coding_system dummy_coding;
 struct coding_system *coding = &dummy_coding;
 Lisp_Object safe_chars;
 reg[0] = CHARSET_ASCII, reg[1] = reg[2] = reg[3] = -1;
-while (mask && src < src_end)
+while (mask)
 {
-ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep);
+ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep, mask & mask_found);
 retry:
 switch (c)
 	{
 	case ISO_CODE_ESC:
 	  if (inhibit_iso_escape_detection)
 	    break;
 	  single_shifting = 0;
-	  ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep);
+	  ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep, mask & mask_found);
 	  if (c >= '(' && c <= '/')
 	    {
 	      /* Designation sequence for a charset of dimension 1.  */
-	      ONE_MORE_BYTE_CHECK_MULTIBYTE (c1, multibytep);
+	      ONE_MORE_BYTE_CHECK_MULTIBYTE (c1, multibytep, mask & mask_found);
 	      if (c1 < ' ' || c1 >= 0x80
 		  || (charset = iso_charset_table[0][c >= ','][c1]) < 0)
 		/* Invalid designation sequence.  Just ignore.  */
 		break;
 	      reg[(c - '(') % 4] = charset;
 	    }
 	  else if (c == '$')
 	    {
 	      /* Designation sequence for a charset of dimension 2.  */
-	      ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep);
+	      ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep, mask & mask_found);
 	      if (c >= '@' && c <= 'B')
 		/* Designation for JISX0208.1978, GB2312, or JISX0208.  */
 		reg[0] = charset = iso_charset_table[1][0][c];
 	      else if (c >= '(' && c <= '/')
 		{
-		  ONE_MORE_BYTE_CHECK_MULTIBYTE (c1, multibytep);
+		  ONE_MORE_BYTE_CHECK_MULTIBYTE (c1, multibytep,
+						 mask & mask_found);
 		  if (c1 < ' ' || c1 >= 0x80
 		      || (charset = iso_charset_table[1][c >= ','][c1]) < 0)
 		    /* Invalid designation sequence.  Just ignore.  */
 		    break;
 		  reg[(c - '(') % 4] = charset;
 		  int i = 1;
 		  c = -1;
 		  while (src < src_end)
 		    {
-		      ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep);
+		      ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep,
+						     mask & mask_found);
 		      if (c < 0xA0)
 			break;
 		      i++;
 		    }
 		}
 	    }
 	  break;
 	}
 }
-label_end_of_loop:
 return (mask & mask_found);
 }
 /* Decode a character of which charset is CHARSET, the 1st position
 code is C1, the 2nd position code is C2, and return the decoded
 struct coding_system dummy_coding;
 struct coding_system *coding = &dummy_coding;
 while (1)
 {
-ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep);
+ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep, CODING_CATEGORY_MASK_SJIS);
 if (c < 0x80)
 	continue;
 if (c == 0x80 || c == 0xA0 || c > 0xEF)
 	return 0;
 if (c <= 0x9F || c >= 0xE0)
 	{
-	  ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep);
+	  ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep, 0);
 	  if (c < 0x40 || c == 0x7F || c > 0xFC)
 	    return 0;
 	}
 }
-label_end_of_loop:
-return CODING_CATEGORY_MASK_SJIS;
 }
 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
 Check if a text is encoded in BIG5.  If it is, return
 CODING_CATEGORY_MASK_BIG5, else return 0.  */
 struct coding_system dummy_coding;
 struct coding_system *coding = &dummy_coding;
 while (1)
 {
-ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep);
+ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep, CODING_CATEGORY_MASK_BIG5);
 if (c < 0x80)
 	continue;
 if (c < 0xA1 || c > 0xFE)
 	return 0;
-ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep);
+ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep, 0);
 if (c < 0x40 || (c > 0x7F && c < 0xA1) || c > 0xFE)
 	return 0;
 }
-label_end_of_loop:
-return CODING_CATEGORY_MASK_BIG5;
 }
 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
 Check if a text is encoded in UTF-8.  If it is, return
 CODING_CATEGORY_MASK_UTF_8, else return 0.  */
 struct coding_system dummy_coding;
 struct coding_system *coding = &dummy_coding;
 while (1)
 {
-ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep);
+ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep, CODING_CATEGORY_MASK_UTF_8);
 if (UTF_8_1_OCTET_P (c))
 	continue;
 else if (UTF_8_2_OCTET_LEADING_P (c))
 	seq_maybe_bytes = 1;
 else if (UTF_8_3_OCTET_LEADING_P (c))
 else
 	return 0;
 do
 	{
-	  ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep);
+	  ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep, 0);
 	  if (!UTF_8_EXTRA_OCTET_P (c))
 	    return 0;
 	  seq_maybe_bytes--;
 	}
 while (seq_maybe_bytes > 0);
 }
-label_end_of_loop:
-return CODING_CATEGORY_MASK_UTF_8;
 }
 /* See the above "GENERAL NOTES on `detect_coding_XXX ()' functions".
 Check if a text is encoded in UTF-16 Big Endian (endian == 1) or
 Little Endian (otherwise).  If it is, return
 unsigned char c1, c2;
 /* Dummy for ONE_MORE_BYTE_CHECK_MULTIBYTE.  */
 struct coding_system dummy_coding;
 struct coding_system *coding = &dummy_coding;
-ONE_MORE_BYTE_CHECK_MULTIBYTE (c1, multibytep);
+ONE_MORE_BYTE_CHECK_MULTIBYTE (c1, multibytep, 0);
-ONE_MORE_BYTE_CHECK_MULTIBYTE (c2, multibytep);
+ONE_MORE_BYTE_CHECK_MULTIBYTE (c2, multibytep, 0);
 if ((c1 == 0xFF) && (c2 == 0xFE))
 return CODING_CATEGORY_MASK_UTF_16_LE;
 else if ((c1 == 0xFE) && (c2 == 0xFF))
 return CODING_CATEGORY_MASK_UTF_16_BE;
-label_end_of_loop:
 return 0;
 }
 /* See the above "GENERAL NOTES on `decode_coding_XXX ()' functions".
 If SJIS_P is 1, decode SJIS text, else decode BIG5 text.  */
 return 0;
 valid = coding_system_table[CODING_CATEGORY_IDX_CCL]->spec.ccl.valid_codes;
 while (1)
 {
-ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep);
+ONE_MORE_BYTE_CHECK_MULTIBYTE (c, multibytep, CODING_CATEGORY_MASK_CCL);
 if (! valid[c])
 	return 0;
 }
-label_end_of_loop:
-return CODING_CATEGORY_MASK_CCL;
 }
 /*** 6. End-of-line handlers ***/

Mercurial > emacs

comparison src/coding.c @ 72395:94e4795b333d