(Fsubst_char_in_region): Correctly handle the case

that byte combining before happens. (Ftranslate_region): Likewise.
author: Kenichi Handa 1998-10-27 03:54:13 +0000
committer: Kenichi Handa 1998-10-27 03:54:13 +0000
commit: a3360ff9150045b8e379bfc856c47ba872ddb0ce (patch)
tree: daf8e0edcba4553b2625d1caeb6a5e6872c50725 /src
parent: b413f89564f18ef411c8fe8f4ec157e41c29c01d (diff)
download: emacs-a3360ff9150045b8e379bfc856c47ba872ddb0ce.tar.gz
emacs-a3360ff9150045b8e379bfc856c47ba872ddb0ce.zip
1 files changed, 69 insertions, 29 deletions
diff --git a/src/editfns.c b/src/editfns.c
index a0c09ebf095..b6302ca05f2 100644
--- a/src/editfns.c
+++ b/src/editfns.c
@@ -1938,6 +1938,7 @@ Both characters must have the same length of multi-byte form.")
  int changed = 0;
  unsigned char fromwork[4], *fromstr, towork[4], *tostr, *p;
  int count = specpdl_ptr - specpdl;
+  int maybe_byte_combining = 0;
  validate_region (&start, &end);
  CHECK_NUMBER (fromchar, 2);
@@ -1948,6 +1949,11 @@ Both characters must have the same length of multi-byte form.")
      len = CHAR_STRING (XFASTINT (fromchar), fromwork, fromstr);
      if (CHAR_STRING (XFASTINT (tochar), towork, tostr) != len)
        error ("Characters in subst-char-in-region have different byte-lengths");
+      if (len == 1)
+        /* If *TOSTR is in the range 0x80..0x9F, it may be combined
+           with the after bytes.  If it is in the range 0xA0..0xFF, it
+           may be combined with the before bytes.  */
+        maybe_byte_combining = !ASCII_BYTE_P (*tostr);
    }
  else
    {
@@ -1980,13 +1986,17 @@ Both characters must have the same length of multi-byte form.")
    stop = min (stop, GPT_BYTE);
  while (1)
    {
+      int pos_byte_next = pos_byte;
      if (pos_byte >= stop)
        {
          if (pos_byte >= end_byte) break;
          stop = end_byte;
        }
      p = BYTE_POS_ADDR (pos_byte);
-      if (p[0] == fromstr[0]
+      INC_POS (pos_byte_next);
+      if (pos_byte_next - pos_byte == len
+          && p[0] == fromstr[0]
          && (len == 1
              || (p[1] == fromstr[1]
                  && (len == 2 || (p[2] == fromstr[2]
@@ -2009,14 +2019,11 @@ Both characters must have the same length of multi-byte form.")
          /* Take care of the case where the new character
             combines with neighboring bytes.  */ 
-          if (len == 1
+          if (maybe_byte_combining
-              && ((! CHAR_HEAD_P (tostr[0])
+              && (CHAR_HEAD_P (*tostr)
-                   && pos_byte > BEGV_BYTE
+                  ? ! CHAR_HEAD_P (FETCH_BYTE (pos_byte + 1))
-                   && ! ASCII_BYTE_P (FETCH_BYTE (pos_byte - 1)))
+                  : (pos_byte > BEGV_BYTE
-                  ||
+                     && ! ASCII_BYTE_P (FETCH_BYTE (pos_byte - 1)))))
-                  (! ASCII_BYTE_P (tostr[0])
-                   && pos_byte + 1 < ZV_BYTE
-                   && ! CHAR_HEAD_P (FETCH_BYTE (pos_byte + 1)))))
            {
              Lisp_Object tem, string;
@@ -2025,15 +2032,24 @@ Both characters must have the same length of multi-byte form.")
              tem = current_buffer->undo_list;
              GCPRO1 (tem);
-              /* Make a multibyte string containing this
+              /* Make a multibyte string containing this single-byte
-                 single-byte character.  */
+                  character.  */
-              string = Fmake_string (make_number (1),
+              string = make_multibyte_string (tostr, 1, 1);
-                                     make_number (tochar));
-              SET_STRING_BYTES (XSTRING (string), 1);
              /* replace_range is less efficient, because it moves the gap,
                 but it handles combining correctly.  */
              replace_range (pos, pos + 1, string,
                             0, 0, 1);
+              pos_byte_next = CHAR_TO_BYTE (pos);
+              if (pos_byte_next > pos_byte)
+                /* Before combining happened.  We should not increment
+                   POS because now it points the next character.  */
+                pos_byte = pos_byte_next;
+              else
+                {
+                  pos++;
+                  INC_POS (pos_byte_next);
+                }
+                
              if (! NILP (noundo))
                current_buffer->undo_list = tem;
@@ -2044,9 +2060,15 @@ Both characters must have the same length of multi-byte form.")
              if (NILP (noundo))
                record_change (pos, 1);
              for (i = 0; i < len; i++) *p++ = tostr[i];
+              pos_byte = pos_byte_next;
+              pos++;
            }
        }
-      INC_BOTH (pos, pos_byte);
+      else
+        {
+          pos_byte = pos_byte_next;
+          pos++;
+        }
    }
  if (changed)
@@ -2092,8 +2114,10 @@ It returns the number of characters changed.")
      register unsigned char *p = BYTE_POS_ADDR (pos_byte);
      int len;
      int oc;
+      int pos_byte_next;
      oc = STRING_CHAR_AND_LENGTH (p, stop - pos_byte, len);
+      pos_byte_next = pos_byte + len;
      if (oc < size && len == 1)
        {
          nc = tt[oc];
@@ -2101,36 +2125,52 @@ It returns the number of characters changed.")
            {
              /* Take care of the case where the new character
                 combines with neighboring bytes.  */ 
-              if ((! CHAR_HEAD_P (nc)
+              if (!ASCII_BYTE_P (nc)
-                   && pos_byte > BEGV_BYTE
+                  && (CHAR_HEAD_P (nc)
-                   && ! ASCII_BYTE_P (FETCH_BYTE (pos_byte - 1)))
+                      ? ! CHAR_HEAD_P (FETCH_BYTE (pos_byte + 1))
-                  ||
+                      : (pos_byte > BEGV_BYTE
-                  (! ASCII_BYTE_P (nc)
+                         && ! ASCII_BYTE_P (FETCH_BYTE (pos_byte - 1)))))
-                   && pos_byte + 1 < ZV_BYTE
-                   && ! CHAR_HEAD_P (FETCH_BYTE (pos_byte + 1))))
                {
                  Lisp_Object string;
-                  string = Fmake_string (make_number (1),
+                  string = make_multibyte_string (tt + oc, 1, 1);
-                                         make_number (nc));
-                  SET_STRING_BYTES (XSTRING (string), 1);
                  /* This is less efficient, because it moves the gap,
                     but it handles combining correctly.  */
                  replace_range (pos, pos + 1, string,
-                                 1, 0, 0);
+                                 1, 0, 1);
+                  pos_byte_next = CHAR_TO_BYTE (pos);
+                  if (pos_byte_next > pos_byte)
+                    /* Before combining happened.  We should not
+                       increment POS because now it points the next
+                       character.  */
+                    pos_byte = pos_byte_next;
+                  else
+                    {
+                      pos++;
+                      INC_POS (pos_byte_next);
+                    }
                }
              else
                {
                  record_change (pos, 1);
                  *p = nc;
                  signal_after_change (pos, 1, 1);
+                  pos_byte++;
+                  pos++;
                }
              ++cnt;
            }
+          else
+            {
+              pos_byte++;
+              pos++;
+            }
+        }
+      else
+        {
+          pos_byte += len;
+          pos++;
        }
-      pos_byte += len;
-      pos++;
    }
  return make_number (cnt);
author	Kenichi Handa	1998-10-27 03:54:13 +0000
committer	Kenichi Handa	1998-10-27 03:54:13 +0000
commit	a3360ff9150045b8e379bfc856c47ba872ddb0ce (patch)
tree	daf8e0edcba4553b2625d1caeb6a5e6872c50725 /src
parent	b413f89564f18ef411c8fe8f4ec157e41c29c01d (diff)
download	emacs-a3360ff9150045b8e379bfc856c47ba872ddb0ce.tar.gz emacs-a3360ff9150045b8e379bfc856c47ba872ddb0ce.zip