summaryrefslogtreecommitdiff
path: root/ext/json
diff options
context:
space:
mode:
authorDmitry Stogov <dmitry@zend.com>2017-05-25 01:16:17 +0300
committerDmitry Stogov <dmitry@zend.com>2017-05-25 01:16:17 +0300
commit13ee8fd626accebd93f943d2d1d23a6e952e060f (patch)
tree8acb8b8997333262df0450c7f191c3fd05a386c0 /ext/json
parentfa828dbe841c654dd7ac87c26929b873168eaea2 (diff)
downloadphp-git-13ee8fd626accebd93f943d2d1d23a6e952e060f.tar.gz
Improved UTF-8 validation in JSON
Diffstat (limited to 'ext/json')
-rw-r--r--ext/json/json_encoder.c37
1 files changed, 10 insertions, 27 deletions
diff --git a/ext/json/json_encoder.c b/ext/json/json_encoder.c
index c88d355fc0..545d229f35 100644
--- a/ext/json/json_encoder.c
+++ b/ext/json/json_encoder.c
@@ -246,40 +246,23 @@ static int php_json_encode_array(smart_str *buf, zval *val, int options, php_jso
}
/* }}} */
-static int php_json_utf8_to_utf16(unsigned short *utf16, char utf8[], size_t len) /* {{{ */
+static int php_json_valid_utf8(char utf8[], size_t len) /* {{{ */
{
size_t pos = 0, us;
- int j, status;
+ int status;
- if (utf16) {
- /* really convert the utf8 string */
- for (j=0 ; pos < len ; j++) {
- us = php_next_utf8_char((const unsigned char *)utf8, len, &pos, &status);
- if (status != SUCCESS) {
- return -1;
- }
- /* From http://en.wikipedia.org/wiki/UTF16 */
- if (us >= 0x10000) {
- us -= 0x10000;
- utf16[j++] = (unsigned short)((us >> 10) | 0xd800);
- utf16[j] = (unsigned short)((us & 0x3ff) | 0xdc00);
- } else {
- utf16[j] = (unsigned short)us;
- }
- }
- } else {
- /* Only check if utf8 string is valid, and compute utf16 length */
- for (j=0 ; pos < len ; j++) {
+ while (pos < len) {
+ us = (unsigned char)utf8[pos];
+ if (us < 0x80) {
+ pos++;
+ } else {
us = php_next_utf8_char((const unsigned char *)utf8, len, &pos, &status);
if (status != SUCCESS) {
- return -1;
- }
- if (us >= 0x10000) {
- j++;
+ return 0;
}
}
}
- return j;
+ return 1;
}
/* }}} */
@@ -315,7 +298,7 @@ static int php_json_escape_string(
if (options & PHP_JSON_UNESCAPED_UNICODE) {
/* validate UTF-8 string first */
- if (php_json_utf8_to_utf16(NULL, s, len) < 0) {
+ if (!php_json_valid_utf8(s, len)) {
encoder->error_code = PHP_JSON_ERROR_UTF8;
if (options & PHP_JSON_PARTIAL_OUTPUT_ON_ERROR) {
smart_str_appendl(buf, "null", 4);