Fix the tests for 'string-limit'

author Eli Zaretskii <eliz@gnu.org>

Wed, 12 May 2021 13:41:03 +0000 (16:41 +0300)

committer Eli Zaretskii <eliz@gnu.org>

Wed, 12 May 2021 13:41:03 +0000 (16:41 +0300)
author Eli Zaretskii <eliz@gnu.org>
Wed, 12 May 2021 13:41:03 +0000 (16:41 +0300)
committer Eli Zaretskii <eliz@gnu.org>
Wed, 12 May 2021 13:41:03 +0000 (16:41 +0300)
diff --git a/lisp/emacs-lisp/subr-x.el b/lisp/emacs-lisp/subr-x.el

index 9c8c967ee9c0cdeff572ccef9e83b786e957b284..5a8885c04270c7e2eded1f9e6e1bc06cee9d84b7 100644 (file)
--- a/lisp/emacs-lisp/subr-x.el
+++ b/lisp/emacs-lisp/subr-x.el
@@ -289,6 +289,18 @@ than this function."
        (let ((result nil)
              (result-length 0)
              (index (if end (1- (length string)) 0)))
+        ;; FIXME: This implementation, which uses encode-coding-char
+        ;; to encode the string one character at a time, is in general
+        ;; incorrect: coding-systems that produce prefix or suffix
+        ;; bytes, such as ISO-2022-based or UTF-8/16 with BOM, will
+        ;; produce those bytes for each character, instead of just
+        ;; once for the entire string.  encode-coding-char attempts to
+        ;; remove those extra bytes at least in some situations, but
+        ;; it cannot do that in all cases.  And in any case, producing
+        ;; what is supposed to be a UTF-16 or ISO-2022-CN encoded
+        ;; string which lacks the BOM bytes at the beginning and the
+        ;; charset designation sequences at the head and tail of the
+        ;; result will definitely surprise the callers in some cases.
          (while (let ((encoded (encode-coding-char
                                 (aref string index) coding-system)))
                   (and (<= (+ (length encoded) result-length) length)
diff --git a/test/lisp/emacs-lisp/subr-x-tests.el b/test/lisp/emacs-lisp/subr-x-tests.el

index 112f3c1dac159a31ab3e5c1add8edcb7fe83e2c2..ef04cde3867295a22859d7542e1f647893f15416 100644 (file)
--- a/test/lisp/emacs-lisp/subr-x-tests.el
+++ b/test/lisp/emacs-lisp/subr-x-tests.el
@@ -607,18 +607,21 @@
    (should (equal (string-limit "foó" 4 nil 'utf-8) "fo\303\263"))
    (should (equal (string-limit "foóa" 4 nil 'utf-8) "fo\303\263"))
    (should (equal (string-limit "foóá" 4 nil 'utf-8) "fo\303\263"))
+  (should (equal (string-limit "foóá" 4 nil 'utf-8-with-signature)
+                 "fo\303\263"))
    (should (equal (string-limit "foóa" 4 nil 'iso-8859-1) "fo\363a"))
    (should (equal (string-limit "foóá" 4 nil 'iso-8859-1) "fo\363\341"))
-  (should (equal (string-limit "foóá" 4 nil 'utf-16) "\376\377\000f"))
+  (should (equal (string-limit "foóá" 4 nil 'utf-16) "\000f\000o"))
  
    (should (equal (string-limit "foó" 10 t 'utf-8) "fo\303\263"))
    (should (equal (string-limit "foó" 3 t 'utf-8) "o\303\263"))
    (should (equal (string-limit "foó" 4 t 'utf-8) "fo\303\263"))
    (should (equal (string-limit "foóa" 4 t 'utf-8) "o\303\263a"))
    (should (equal (string-limit "foóá" 4 t 'utf-8) "\303\263\303\241"))
+  (should (equal (string-limit "foóá" 2 t 'utf-8-with-signature) "\303\241"))
    (should (equal (string-limit "foóa" 4 t 'iso-8859-1) "fo\363a"))
    (should (equal (string-limit "foóá" 4 t 'iso-8859-1) "fo\363\341"))
-  (should (equal (string-limit "foóá" 4 t 'utf-16) "\376\377\000\341")))
+  (should (equal (string-limit "foóá" 4 t 'utf-16) "\000\363\000\341")))
  
  (ert-deftest subr-string-lines ()
    (should (equal (string-lines "foo") '("foo")))
author	Eli Zaretskii <eliz@gnu.org>
	Wed, 12 May 2021 13:41:03 +0000 (16:41 +0300)
committer	Eli Zaretskii <eliz@gnu.org>
	Wed, 12 May 2021 13:41:03 +0000 (16:41 +0300)
lisp/emacs-lisp/subr-x.el		patch | blob | history
test/lisp/emacs-lisp/subr-x-tests.el		patch | blob | history