emacs: src/coding.c comparison

comparison src/coding.c @ 21744:64c815fe1bdc

(shrink_decoding_region): Do not consider LF as ASCII if preceded by CR, since that confuses EOL decoding. (code_convert_region): When conversion fails with CODING_FINISH_INSUFFICIENT_SRC, the code was overwriting src with garbage from dst instead of copying from src to dst.

author	Richard M. Stallman <rms@gnu.org>
date	Fri, 24 Apr 1998 01:05:25 +0000
parents	4097e558fa19
children	376ce06ab12d

comparison

equal deleted inserted replaced

-:8def83521606
+:64c815fe1bdc
 case coding_type_raw_text:
 if (eol_conversion)
 	{
 	  if (coding->heading_ascii < 0)
 	    while (begp < endp && *begp != '\r' && *begp < 0x80) begp++;
-	  while (begp < endp && *(endp - 1) != '\r' && *(endp - 1) < 0x80)
+	  while (begp < endp && endp[-1] != '\r' && endp[-1] < 0x80)
 	    endp--;
+	  /* Do not consider LF as ascii if preceded by CR, since that
+confuses eol decoding. */
+	  if (begp < endp && endp < endp_orig && endp[-1] == '\r' && endp[0] == '\n')
+	    endp++;
 	}
 else
 	begp = endp;
 break;
 	 second byte of SJIS or BIG5 code.  */
 if (eol_conversion)
 	while (begp < endp && endp[-1] < 0x80 && endp[-1] != '\r') endp--;
 else
 	while (begp < endp && endp[-1] < 0x80) endp--;
+/* Do not consider LF as ascii if preceded by CR, since that
+	 confuses eol decoding. */
+if (begp < endp && endp < endp_orig && endp[-1] == '\r' && endp[0] == '\n')
+	endp++;
 if (begp < endp && endp < endp_orig && endp[-1] >= 0x80)
 	endp++;
 break;
 default:		/* i.e. case coding_type_iso2022: */
 	  /* We can skip all ASCII characters at the tail.  */
 	  if (eol_conversion)
 	    while (begp < endp && (c = endp[-1]) < 0x80 && c != '\r') endp--;
 	  else
 	    while (begp < endp && endp[-1] < 0x80) endp--;
+	  /* Do not consider LF as ascii if preceded by CR, since that
+confuses eol decoding. */
+	  if (begp < endp && endp < endp_orig && endp[-1] == '\r' && endp[0] == '\n')
+	    endp++;
 	  break;
 	case CODING_CATEGORY_IDX_ISO_7:
 	case CODING_CATEGORY_IDX_ISO_7_TIGHT:
 	  /* We can skip all characters at the tail except for ESC and
 	      endp--;
 	  else
 	    while (begp < endp
 		   && (c = endp[-1]) < 0x80 && c != ISO_CODE_ESC)
 	      endp--;
+	  /* Do not consider LF as ascii if preceded by CR, since that
+confuses eol decoding. */
+	  if (begp < endp && endp < endp_orig && endp[-1] == '\r' && endp[0] == '\n')
+	    endp++;
 	  if (begp < endp && endp[-1] == ISO_CODE_ESC)
 	    {
 	      if (endp + 1 < endp_orig && end[0] == '(' && end[1] == 'B')
 		/* This is an ASCII designation sequence.  We can
 surely skip the tail.  */
 	  /* The source text ends in invalid codes.  Let's just
 	     make them valid buffer contents, and finish conversion.  */
 	  inserted += len_byte;
 	  inserted_byte += len_byte;
 	  while (len_byte--)
-	    *src++ = *dst++;
+	    *dst++ = *src++;
 	  fake_multibyte = 1;
 	  break;
 	}
 if (first)
 	{

Mercurial > emacs

comparison src/coding.c @ 21744:64c815fe1bdc