diff options
Diffstat (limited to 'gettext-tools/src/po-charset.h')
-rw-r--r-- | gettext-tools/src/po-charset.h | 93 |
1 files changed, 93 insertions, 0 deletions
diff --git a/gettext-tools/src/po-charset.h b/gettext-tools/src/po-charset.h new file mode 100644 index 0000000..65798e7 --- /dev/null +++ b/gettext-tools/src/po-charset.h @@ -0,0 +1,93 @@ +/* Charset handling while reading PO files. + Copyright (C) 2001-2003, 2006 Free Software Foundation, Inc. + Written by Bruno Haible <haible@clisp.cons.org>, 2001. + + This program is free software: you can redistribute it and/or modify + it under the terms of the GNU General Public License as published by + the Free Software Foundation; either version 3 of the License, or + (at your option) any later version. + + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU General Public License for more details. + + You should have received a copy of the GNU General Public License + along with this program. If not, see <http://www.gnu.org/licenses/>. */ + +#ifndef _PO_CHARSET_H +#define _PO_CHARSET_H + +#include <stdbool.h> +#include <stddef.h> + +#if HAVE_ICONV +#include <iconv.h> +#endif + + +#ifdef __cplusplus +extern "C" { +#endif + + +/* Canonicalize an encoding name. + The results of this function are statically allocated and can be + compared using ==. */ +extern const char *po_charset_canonicalize (const char *charset); + +/* The canonicalized encoding name for ASCII. */ +extern DLL_VARIABLE const char *po_charset_ascii; + +/* The canonicalized encoding name for UTF-8. */ +extern DLL_VARIABLE const char *po_charset_utf8; + +/* Test for ASCII compatibility. */ +extern bool po_charset_ascii_compatible (const char *canon_charset); + +/* Test for a weird encoding, i.e. an encoding which has double-byte + characters ending in 0x5C. */ +extern bool po_is_charset_weird (const char *canon_charset); + +/* Test for a weird CJK encoding, i.e. a weird encoding with CJK structure. + An encoding has CJK structure if every valid character stream is composed + of single bytes in the range 0x{00..7F} and of byte pairs in the range + 0x{80..FF}{30..FF}. */ +extern bool po_is_charset_weird_cjk (const char *canon_charset); + +/* Returns a character iterator for a given encoding. + Given a pointer into a string, it returns the number occupied by the next + single character. If the piece of string is not valid or if the *s == '\0', + it returns 1. */ +typedef size_t (*character_iterator_t) (const char *s); +extern character_iterator_t po_charset_character_iterator (const char *canon_charset); + + +/* The PO file's encoding, as specified in the header entry. */ +extern DLL_VARIABLE const char *po_lex_charset; + +#if HAVE_ICONV +/* Converter from the PO file's encoding to UTF-8. */ +extern DLL_VARIABLE iconv_t po_lex_iconv; +#endif +/* If no converter is available, some information about the structure of the + PO file's encoding. */ +extern DLL_VARIABLE bool po_lex_weird_cjk; + +/* Initialize the PO file's encoding. */ +extern void po_lex_charset_init (void); + +/* Set the PO file's encoding from the header entry. */ +extern void po_lex_charset_set (const char *header_entry, + const char *filename); + +/* Finish up with the PO file's encoding. */ +extern void po_lex_charset_close (void); + + +#ifdef __cplusplus +} +#endif + + +#endif /* _PO_CHARSET_H */ |