summaryrefslogtreecommitdiff
path: root/src/coding.c
diff options
context:
space:
mode:
authorEli Zaretskii <eliz@gnu.org>2020-04-09 12:18:30 +0300
committerEli Zaretskii <eliz@gnu.org>2020-04-09 12:18:30 +0300
commitfaf996dc6e963a8dd74e9e794ded0467dd78ea18 (patch)
tree05414568c1e99a0226101e37fb94dc4ade687699 /src/coding.c
parent1aeb1819353418ebed635f18a009048700ba1ad0 (diff)
downloademacs-faf996dc6e963a8dd74e9e794ded0467dd78ea18.tar.gz
Fix decoding ASCII strings with embedded CR characters
* src/coding.c (string_ascii_p): Return a negative value if an all-ASCII string STR includes the CR character, otherwise a positive value. (code_convert_string): If the string is ASCII, but includes CR characters, use the fast path only if EOL doesn't need to be decoded. (Bug#40519) * test/src/coding-tests.el (coding-nocopy-ascii): Add tests for bug#40519.
Diffstat (limited to 'src/coding.c')
-rw-r--r--src/coding.c37
1 files changed, 26 insertions, 11 deletions
diff --git a/src/coding.c b/src/coding.c
index 49c1e625d57..24a832ff3ee 100644
--- a/src/coding.c
+++ b/src/coding.c
@@ -9471,15 +9471,22 @@ not fully specified.) */)
return code_convert_region (start, end, coding_system, destination, 1, 0);
}
-/* Whether a string only contains chars in the 0..127 range. */
-static bool
+/* Non-zero if STR contains only characterss in the 0..127 range.
+ Positive if STR includes characters that don't need EOL conversion
+ on decoding, negative otherwise. */
+static int
string_ascii_p (Lisp_Object str)
{
ptrdiff_t nbytes = SBYTES (str);
+ bool CR_Seen = false;
for (ptrdiff_t i = 0; i < nbytes; i++)
- if (SREF (str, i) > 127)
- return false;
- return true;
+ {
+ if (SREF (str, i) > 127)
+ return 0;
+ if (SREF (str, i) == '\r')
+ CR_Seen = true;
+ }
+ return CR_Seen ? -1 : 1;
}
Lisp_Object
@@ -9517,15 +9524,23 @@ code_convert_string (Lisp_Object string, Lisp_Object coding_system,
{
/* Fast path for ASCII-only input and an ASCII-compatible coding:
act as identity. */
+ int ascii_p;
Lisp_Object attrs = CODING_ID_ATTRS (coding.id);
if (! NILP (CODING_ATTR_ASCII_COMPAT (attrs))
&& (STRING_MULTIBYTE (string)
- ? (chars == bytes) : string_ascii_p (string)))
- return (nocopy
- ? string
- : (encodep
- ? make_unibyte_string (SSDATA (string), bytes)
- : make_multibyte_string (SSDATA (string), bytes, bytes)));
+ ? (chars == bytes) : ((ascii_p = string_ascii_p (string)) != 0)))
+ {
+ if (ascii_p > 0
+ || (ascii_p < 0
+ && (EQ (CODING_ID_EOL_TYPE (coding.id), Qunix)
+ || inhibit_eol_conversion)))
+ return (nocopy
+ ? string
+ : (encodep
+ ? make_unibyte_string (SSDATA (string), bytes)
+ : make_multibyte_string (SSDATA (string),
+ bytes, bytes)));
+ }
}
else if (BUFFERP (dst_object))
{