diff options
Diffstat (limited to 'pango/utils.c')
-rw-r--r-- | pango/utils.c | 153 |
1 files changed, 153 insertions, 0 deletions
diff --git a/pango/utils.c b/pango/utils.c new file mode 100644 index 00000000..d3ab9fdd --- /dev/null +++ b/pango/utils.c @@ -0,0 +1,153 @@ +/* Pango + * utils.c: + * + * Copyright (C) 1999 Red Hat Software + * + * This library is free software; you can redistribute it and/or + * modify it under the terms of the GNU Library General Public + * License as published by the Free Software Foundation; either + * version 2 of the License, or (at your option) any later version. + * + * This library is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + * Library General Public License for more details. + * + * You should have received a copy of the GNU Library General Public + * License along with this library; if not, write to the + * Free Software Foundation, Inc., 59 Temple Place - Suite 330, + * Boston, MA 02111-1307, USA. + */ + +#include "utils.h" +#include <iconv.h> +#include <errno.h> +#include <unicode.h> + +gboolean +_pango_utf8_iterate (gchar *cur, char **next, GUChar4 *wc_out) +{ + gchar *p = cur; + gchar c = *p; + GUChar4 wc; + gint length; + + if ((c & 0x80) == 0) + { + length = 1; + wc = c; + } + else if ((c & 0xc0) == 0x80) + { + return FALSE; + } + else if ((c & 0xe0) == 0xc0) + { + length = 2; + wc = c & 0x1f; + } + else if ((c & 0xf0) == 0xe0) + { + length = 3; + wc = c & 0x0f; + } + else + return FALSE; + + p++; + while (--length > 0) + { + if (*p == 0) /* Incomplete character */ + { + if (next) + *next = cur; + if (wc_out) + *wc_out = 0; + return TRUE; + } + + if ((*p & 0xc0) != 0x80) + return FALSE; + + wc <<= 6; + wc |= (*p) & 0x3f; + + p++; + } + + if (wc_out) + *wc_out = wc; + if (next) + *next = p; + + return TRUE; +} + +gint +_pango_utf8_len (gchar *str, gint limit) +{ + gchar *cur = str; + gchar *next; + gint len = 0; + + while (*cur) + { + if (!_pango_utf8_iterate (cur, &next, NULL)) + return -1; + if (cur == next) + break; + if (limit >= 0 && (next - str) > limit) + return len; + cur = next; + len++; + } + + return len; +} + +#if G_BYTE_ORDER == G_LITTLE_ENDIAN +#define UCS2_CHARSET "UNICODELITTLE" +#else +#define UCS2_CHARSET "UNICODE" +#endif + +GUChar2 * +_pango_utf8_to_ucs2 (gchar *str, gint len) +{ + iconv_t cd; + gchar *outbuf, *result; + gchar *inbuf; + size_t inbytesleft; + size_t outbytesleft; + gint outlen; + + gint count; + + cd = iconv_open (UCS2_CHARSET, "UTF8"); + + if (cd == (iconv_t)-1) + g_error ("No converter from UTF8 to " UCS2_CHARSET); + + if (len < 0) + len = strlen (str); + + outlen = unicode_strlen (str, len) * sizeof(GUChar2); + result = g_malloc (outlen); + + inbuf = str; + inbytesleft = len; + outbuf = result; + outbytesleft = outlen; + + count = iconv (cd, &inbuf, &inbytesleft, &outbuf, &outbytesleft); + + if (count < 0 && (errno != E2BIG)) + { + g_free (result); + result = NULL; + } + + iconv_close (cd); + + return (GUChar2 *)result; +} |