summaryrefslogtreecommitdiff
path: root/strings
diff options
context:
space:
mode:
authorunknown <konstantin@mysql.com>2005-01-13 17:31:49 +0300
committerunknown <konstantin@mysql.com>2005-01-13 17:31:49 +0300
commit9c4824af7c1985d7d439f523aa8a85402cde9808 (patch)
tree589a6b326750729b4c6b6133c6f985394d9d387a /strings
parent9d983c4550cf8e5c5342509f6508ca0e35600acd (diff)
parent9842aca3ef48bf56a6c3ee5b9e1159e4249ce346 (diff)
downloadmariadb-git-9c4824af7c1985d7d439f523aa8a85402cde9808.tar.gz
manual merge
mysql-test/r/ctype_latin1_de.result: Auto merged mysql-test/r/ctype_tis620.result: Auto merged mysql-test/r/ctype_ucs.result: Auto merged mysql-test/r/ctype_ujis.result: Auto merged mysql-test/r/ctype_utf8.result: Auto merged mysql-test/t/ctype_ucs.test: Auto merged sql/field.cc: Auto merged sql/filesort.cc: Auto merged strings/ctype-big5.c: Auto merged strings/ctype-bin.c: Auto merged strings/ctype-czech.c: Auto merged strings/ctype-gbk.c: Auto merged strings/ctype-latin1.c: Auto merged strings/ctype-mb.c: Auto merged strings/ctype-simple.c: Auto merged strings/ctype-sjis.c: Auto merged strings/ctype-tis620.c: Auto merged strings/ctype-uca.c: Auto merged strings/ctype-ucs2.c: Auto merged strings/ctype-utf8.c: Auto merged strings/ctype-win1250ch.c: Auto merged
Diffstat (limited to 'strings')
-rw-r--r--strings/ctype-big5.c5
-rw-r--r--strings/ctype-bin.c26
-rw-r--r--strings/ctype-czech.c8
-rw-r--r--strings/ctype-gbk.c5
-rw-r--r--strings/ctype-latin1.c5
-rw-r--r--strings/ctype-mb.c11
-rw-r--r--strings/ctype-simple.c45
-rw-r--r--strings/ctype-sjis.c4
-rw-r--r--strings/ctype-tis620.c6
-rw-r--r--strings/ctype-uca.c16
-rw-r--r--strings/ctype-ucs2.c9
-rw-r--r--strings/ctype-utf8.c5
-rw-r--r--strings/ctype-win1250ch.c4
13 files changed, 117 insertions, 32 deletions
diff --git a/strings/ctype-big5.c b/strings/ctype-big5.c
index d9532cddc4d..a2db7de244e 100644
--- a/strings/ctype-big5.c
+++ b/strings/ctype-big5.c
@@ -307,6 +307,7 @@ static int my_strnxfrm_big5(CHARSET_INFO *cs __attribute__((unused)),
const uchar * src, uint srclen)
{
uint16 e;
+ uint dstlen= len;
len = srclen;
while (len--)
@@ -321,7 +322,9 @@ static int my_strnxfrm_big5(CHARSET_INFO *cs __attribute__((unused)),
} else
*dest++ = sort_order_big5[(uchar) *src++];
}
- return srclen;
+ if (dstlen > srclen)
+ bfill(dest, dstlen - srclen, ' ');
+ return dstlen;
}
#if 0
diff --git a/strings/ctype-bin.c b/strings/ctype-bin.c
index db57c75d9f1..401605a462f 100644
--- a/strings/ctype-bin.c
+++ b/strings/ctype-bin.c
@@ -356,13 +356,27 @@ static int my_wildcmp_bin(CHARSET_INFO *cs,
static int my_strnxfrm_bin(CHARSET_INFO *cs __attribute__((unused)),
- uchar * dest, uint len,
- const uchar *src,
- uint srclen __attribute__((unused)))
+ uchar * dest, uint dstlen,
+ const uchar *src, uint srclen)
{
if (dest != src)
- memcpy(dest,src,len= min(len,srclen));
- return len;
+ memcpy(dest, src, min(dstlen,srclen));
+ if (dstlen > srclen)
+ bfill(dest + srclen, dstlen - srclen, 0);
+ return dstlen;
+}
+
+
+static
+int my_strnxfrm_8bit_bin(CHARSET_INFO *cs __attribute__((unused)),
+ uchar * dest, uint dstlen,
+ const uchar *src, uint srclen)
+{
+ if (dest != src)
+ memcpy(dest, src, min(dstlen,srclen));
+ if (dstlen > srclen)
+ bfill(dest + srclen, dstlen - srclen, ' ');
+ return dstlen;
}
@@ -432,7 +446,7 @@ MY_COLLATION_HANDLER my_collation_8bit_bin_handler =
NULL, /* init */
my_strnncoll_8bit_bin,
my_strnncollsp_8bit_bin,
- my_strnxfrm_bin,
+ my_strnxfrm_8bit_bin,
my_like_range_simple,
my_wildcmp_bin,
my_strcasecmp_bin,
diff --git a/strings/ctype-czech.c b/strings/ctype-czech.c
index 76981200a4d..2834dbb28ff 100644
--- a/strings/ctype-czech.c
+++ b/strings/ctype-czech.c
@@ -298,16 +298,18 @@ static int my_strnxfrm_czech(CHARSET_INFO *cs __attribute__((unused)),
int value;
const uchar * p, * store;
int pass = 0;
- int totlen = 0;
+ uint totlen = 0;
p = src; store = src;
do
{
NEXT_CMP_VALUE(src, p, store, pass, value, (int)srclen);
- ADD_TO_RESULT(dest, (int)len, totlen, value);
+ ADD_TO_RESULT(dest, len, totlen, value);
}
while (value);
- return totlen;
+ if (len > totlen)
+ bfill(dest + totlen, len - totlen, ' ');
+ return len;
}
#undef IS_END
diff --git a/strings/ctype-gbk.c b/strings/ctype-gbk.c
index 858624c0600..dc4aea60096 100644
--- a/strings/ctype-gbk.c
+++ b/strings/ctype-gbk.c
@@ -2668,6 +2668,7 @@ static int my_strnxfrm_gbk(CHARSET_INFO *cs __attribute__((unused)),
const uchar * src, uint srclen)
{
uint16 e;
+ uint dstlen= len;
len = srclen;
while (len--)
@@ -2682,7 +2683,9 @@ static int my_strnxfrm_gbk(CHARSET_INFO *cs __attribute__((unused)),
} else
*dest++ = sort_order_gbk[(uchar) *src++];
}
- return srclen;
+ if (dstlen > srclen)
+ bfill(dest, dstlen - srclen, ' ');
+ return dstlen;
}
diff --git a/strings/ctype-latin1.c b/strings/ctype-latin1.c
index 69c9ed4b023..b5da99a7452 100644
--- a/strings/ctype-latin1.c
+++ b/strings/ctype-latin1.c
@@ -646,7 +646,6 @@ static int my_strnxfrm_latin1_de(CHARSET_INFO *cs __attribute__((unused)),
uchar * dest, uint len,
const uchar * src, uint srclen)
{
- const uchar *dest_orig = dest;
const uchar *de = dest + len;
const uchar *se = src + srclen;
for ( ; src < se && dest < de ; src++)
@@ -656,7 +655,9 @@ static int my_strnxfrm_latin1_de(CHARSET_INFO *cs __attribute__((unused)),
if ((chr=combo2map[*src]) && dest < de)
*dest++=chr;
}
- return (int) (dest - dest_orig);
+ if (dest < de)
+ bfill(dest, de - dest, ' ');
+ return (int) len;
}
diff --git a/strings/ctype-mb.c b/strings/ctype-mb.c
index 0475fb0fbb1..4be21599fef 100644
--- a/strings/ctype-mb.c
+++ b/strings/ctype-mb.c
@@ -425,13 +425,14 @@ static int my_strnncollsp_mb_bin(CHARSET_INFO * cs __attribute__((unused)),
static int my_strnxfrm_mb_bin(CHARSET_INFO *cs __attribute__((unused)),
- uchar * dest, uint len,
- const uchar *src,
- uint srclen __attribute__((unused)))
+ uchar * dest, uint dstlen,
+ const uchar *src, uint srclen)
{
if (dest != src)
- memcpy(dest,src,len= min(len,srclen));
- return len;
+ memcpy(dest, src, min(dstlen, srclen));
+ if (dstlen > srclen)
+ bfill(dest + srclen, dstlen - srclen, ' ');
+ return dstlen;
}
diff --git a/strings/ctype-simple.c b/strings/ctype-simple.c
index 0659cb5d387..1df81c88258 100644
--- a/strings/ctype-simple.c
+++ b/strings/ctype-simple.c
@@ -21,27 +21,68 @@
#include "stdarg.h"
+/*
+ Converts a string into its sort key.
+
+ SYNOPSIS
+ my_strnxfrm_xxx()
+
+ IMPLEMENTATION
+
+ The my_strxfrm_xxx() function transforms a string pointed to by
+ 'src' with length 'srclen' according to the charset+collation
+ pair 'cs' and copies the result key into 'dest'.
+
+ Comparing two strings using memcmp() after my_strnxfrm_xxx()
+ is equal to comparing two original strings with my_strnncollsp_xxx().
+
+ Not more than 'dstlen' bytes are written into 'dst'.
+ To garantee that the whole string is transformed, 'dstlen' must be
+ at least srclen*cs->strnxfrm_multiply bytes long. Otherwise,
+ consequent memcmp() may return a non-accurate result.
+
+ If the source string is too short to fill whole 'dstlen' bytes,
+ then the 'dest' string is padded up to 'dstlen', ensuring that:
+
+ "a" == "a "
+ "a\0" < "a"
+ "a\0" < "a "
+
+ my_strnxfrm_simple() is implemented for 8bit charsets and
+ simple collations with one-to-one string->key transformation.
+
+ See also implementations for various charsets/collations in
+ other ctype-xxx.c files.
+
+ RETURN
+
+ Target len 'dstlen'.
+
+*/
+
int my_strnxfrm_simple(CHARSET_INFO * cs,
uchar *dest, uint len,
const uchar *src, uint srclen)
{
uchar *map= cs->sort_order;
+ uint dstlen= len;
set_if_smaller(len, srclen);
if (dest != src)
{
const uchar *end;
for ( end=src+len; src < end ; )
*dest++= map[*src++];
- return len;
}
else
{
const uchar *end;
for ( end=dest+len; dest < end ; dest++)
*dest= (char) map[(uchar) *dest];
- return len;
}
+ if (dstlen > len)
+ bfill(dest, dstlen - len, ' ');
+ return dstlen;
}
int my_strnncoll_simple(CHARSET_INFO * cs, const uchar *s, uint slen,
diff --git a/strings/ctype-sjis.c b/strings/ctype-sjis.c
index 12bee9082b6..c1e41dc2d94 100644
--- a/strings/ctype-sjis.c
+++ b/strings/ctype-sjis.c
@@ -299,7 +299,9 @@ static int my_strnxfrm_sjis(CHARSET_INFO *cs __attribute__((unused)),
else
*dest++ = sort_order_sjis[(uchar)*src++];
}
- return srclen;
+ if (len > srclen)
+ bfill(dest, len - srclen, ' ');
+ return len;
}
diff --git a/strings/ctype-tis620.c b/strings/ctype-tis620.c
index 80af8e2014b..c6bdd106ad4 100644
--- a/strings/ctype-tis620.c
+++ b/strings/ctype-tis620.c
@@ -638,9 +638,13 @@ int my_strnxfrm_tis620(CHARSET_INFO *cs __attribute__((unused)),
uchar * dest, uint len,
const uchar * src, uint srclen)
{
+ uint dstlen= len;
len= (uint) (strmake((char*) dest, (char*) src, min(len, srclen)) -
(char*) dest);
- return (int) thai2sortable(dest, len);
+ len= thai2sortable(dest, len);
+ if (dstlen > len)
+ bfill(dest + len, dstlen - len, ' ');
+ return dstlen;
}
diff --git a/strings/ctype-uca.c b/strings/ctype-uca.c
index fb44a56ef0f..605dd2cdab0 100644
--- a/strings/ctype-uca.c
+++ b/strings/ctype-uca.c
@@ -7220,8 +7220,7 @@ static int my_strnxfrm_uca(CHARSET_INFO *cs,
uchar *dst, uint dstlen,
const uchar *src, uint srclen)
{
- uchar *de = dst + dstlen;
- const uchar *dst_orig = dst;
+ uchar *de = dst + (dstlen & (uint) ~1); // add even length for easier code
int s_res;
my_uca_scanner scanner;
scanner_handler->init(&scanner, cs, src, srclen);
@@ -7232,8 +7231,17 @@ static int my_strnxfrm_uca(CHARSET_INFO *cs,
dst[1]= s_res & 0xFF;
dst+= 2;
}
- for ( ; dst < de; *dst++='\0');
- return dst - dst_orig;
+ s_res= cs->sort_order_big[0][0x20 * cs->sort_order[0]];
+ while (dst < de)
+ {
+ dst[0]= s_res >> 8;
+ dst[1]= s_res & 0xFF;
+ dst+= 2;
+ }
+ if (dstlen & 1) // if odd number then fill the last char
+ *dst= '\0';
+
+ return dstlen;
}
diff --git a/strings/ctype-ucs2.c b/strings/ctype-ucs2.c
index d21b340e768..6bd93a93e8a 100644
--- a/strings/ctype-ucs2.c
+++ b/strings/ctype-ucs2.c
@@ -352,7 +352,6 @@ static int my_strnxfrm_ucs2(CHARSET_INFO *cs,
int plane;
uchar *de = dst + dstlen;
const uchar *se = src + srclen;
- const uchar *dst_orig = dst;
while( src < se && dst < de )
{
@@ -372,7 +371,9 @@ static int my_strnxfrm_ucs2(CHARSET_INFO *cs,
}
dst+=res;
}
- return dst - dst_orig;
+ if (dst < de)
+ cs->cset->fill(cs, dst, de - dst, ' ');
+ return dstlen;
}
@@ -1385,7 +1386,9 @@ int my_strnxfrm_ucs2_bin(CHARSET_INFO *cs __attribute__((unused)),
{
if (dst != src)
memcpy(dst,src,srclen= min(dstlen,srclen));
- return srclen;
+ if (dstlen > srclen)
+ cs->cset->fill(cs, dst + srclen, dstlen - srclen, ' ');
+ return dstlen;
}
diff --git a/strings/ctype-utf8.c b/strings/ctype-utf8.c
index ab646d36e25..1f9f158a73d 100644
--- a/strings/ctype-utf8.c
+++ b/strings/ctype-utf8.c
@@ -2247,7 +2247,6 @@ static int my_strnxfrm_utf8(CHARSET_INFO *cs,
int plane;
uchar *de = dst + dstlen;
const uchar *se = src + srclen;
- const uchar *dst_orig = dst;
while( src < se && dst < de )
{
@@ -2267,7 +2266,9 @@ static int my_strnxfrm_utf8(CHARSET_INFO *cs,
}
dst+=res;
}
- return dst - dst_orig;
+ if (dst < de)
+ bfill(dst, de - dst, ' ');
+ return dstlen;
}
static int my_ismbchar_utf8(CHARSET_INFO *cs,const char *b, const char *e)
diff --git a/strings/ctype-win1250ch.c b/strings/ctype-win1250ch.c
index 397dcd6f2f2..b58a8f0f1e5 100644
--- a/strings/ctype-win1250ch.c
+++ b/strings/ctype-win1250ch.c
@@ -505,7 +505,9 @@ static int my_strnxfrm_win1250ch(CHARSET_INFO * cs __attribute__((unused)),
dest[totlen] = value;
totlen++;
} while (value) ;
- return totlen;
+ if (len > totlen)
+ bfill(dest + totlen, len - totlen, ' ');
+ return len;
}
#undef IS_END