diff options
author | Moriyoshi Koizumi <moriyoshi@php.net> | 2010-12-19 16:36:37 +0000 |
---|---|---|
committer | Moriyoshi Koizumi <moriyoshi@php.net> | 2010-12-19 16:36:37 +0000 |
commit | bbf3d43c1ee0ad53b03c3821cd630f0746d5e954 (patch) | |
tree | fd11ea79a69ee445ffde8310a3760603bf3df821 /Zend/zend_multibyte.h | |
parent | c28cac404d2d0590ba2811f41331c60d09adbf1e (diff) | |
download | php-git-bbf3d43c1ee0ad53b03c3821cd630f0746d5e954.tar.gz |
* Refactor zend_multibyte facility.
Now mbstring.script_encoding is superseded by zend.script_encoding.
Diffstat (limited to 'Zend/zend_multibyte.h')
-rw-r--r-- | Zend/zend_multibyte.h | 85 |
1 files changed, 44 insertions, 41 deletions
diff --git a/Zend/zend_multibyte.h b/Zend/zend_multibyte.h index 94d8417b80..8233da6b39 100644 --- a/Zend/zend_multibyte.h +++ b/Zend/zend_multibyte.h @@ -22,59 +22,62 @@ #ifndef ZEND_MULTIBYTE_H #define ZEND_MULTIBYTE_H -#define BOM_UTF32_BE "\x00\x00\xfe\xff" -#define BOM_UTF32_LE "\xff\xfe\x00\x00" -#define BOM_UTF16_BE "\xfe\xff" -#define BOM_UTF16_LE "\xff\xfe" -#define BOM_UTF8 "\xef\xbb\xbf" +typedef struct _zend_encoding zend_encoding; typedef size_t (*zend_encoding_filter)(unsigned char **str, size_t *str_length, const unsigned char *buf, size_t length TSRMLS_DC); -typedef char* (*zend_encoding_detector)(const unsigned char *string, size_t length, char *list TSRMLS_DC); - -typedef int (*zend_encoding_converter)(unsigned char **to, size_t *to_length, const unsigned char *from, size_t from_length, const char *encoding_to, const char *encoding_from TSRMLS_DC); - -typedef size_t (*zend_encoding_oddlen)(const unsigned char *string, size_t length, const char *encoding TSRMLS_DC); - -typedef int (*zend_encoding_list_checker)(const char *encoding_list TSRMLS_DC); - -typedef const char* (*zend_encoding_name_getter)(TSRMLS_D); - -typedef struct _zend_encoding { - zend_encoding_filter input_filter; /* escape input filter */ - zend_encoding_filter output_filter; /* escape output filter */ - const char *name; /* encoding name */ - const char *(*aliases)[]; /* encoding name aliases */ - zend_bool compatible; /* flex compatible or not */ -} zend_encoding; - +typedef const zend_encoding* (*zend_encoding_fetcher)(const char *encoding_name TSRMLS_DC); +typedef const char* (*zend_encoding_name_getter)(const zend_encoding *encoding); +typedef int (*zend_encoding_lexer_compatibility_checker)(const zend_encoding *encoding); +typedef const zend_encoding *(*zend_encoding_detector)(const unsigned char *string, size_t length, const zend_encoding **list, size_t list_size TSRMLS_DC); +typedef size_t (*zend_encoding_converter)(unsigned char **to, size_t *to_length, const unsigned char *from, size_t from_length, const zend_encoding *encoding_to, const zend_encoding *encoding_from TSRMLS_DC); +typedef int (*zend_encoding_list_parser)(const char *encoding_list, size_t encoding_list_len, const zend_encoding ***return_list, size_t *return_size, int persistent TSRMLS_DC); +typedef const zend_encoding *(*zend_encoding_internal_encoding_getter)(TSRMLS_D); +typedef int (*zend_encoding_internal_encoding_setter)(const zend_encoding *encoding TSRMLS_DC); + +typedef struct _zend_multibyte_functions { + const char *provider_name; + zend_encoding_fetcher encoding_fetcher; + zend_encoding_name_getter encoding_name_getter; + zend_encoding_lexer_compatibility_checker lexer_compatibility_checker; + zend_encoding_detector encoding_detector; + zend_encoding_converter encoding_converter; + zend_encoding_list_parser encoding_list_parser; + zend_encoding_internal_encoding_getter internal_encoding_getter; + zend_encoding_internal_encoding_setter internal_encoding_setter; +} zend_multibyte_functions; /* * zend multibyte APIs */ BEGIN_EXTERN_C() -/* multibyte utility functions */ -ZEND_API extern zend_encoding_detector zend_multibyte_encoding_detector; -ZEND_API extern zend_encoding_converter zend_multibyte_encoding_converter; -ZEND_API extern zend_encoding_oddlen zend_multibyte_encoding_oddlen; -ZEND_API extern zend_encoding_list_checker zend_multibyte_check_encoding_list; -ZEND_API extern zend_encoding_name_getter zend_multibyte_get_internal_encoding; +ZEND_API extern const zend_encoding *zend_multibyte_encoding_utf32be; +ZEND_API extern const zend_encoding *zend_multibyte_encoding_utf32le; +ZEND_API extern const zend_encoding *zend_multibyte_encoding_utf16be; +ZEND_API extern const zend_encoding *zend_multibyte_encoding_utf16le; +ZEND_API extern const zend_encoding *zend_multibyte_encoding_utf8; -ZEND_API int zend_multibyte_set_script_encoding(const char *encoding_list, -size_t encoding_list_size TSRMLS_DC); -ZEND_API int zend_multibyte_set_internal_encoding(const char *encoding_name TSRMLS_DC); -ZEND_API int zend_multibyte_set_functions(zend_encoding_detector encoding_detector, zend_encoding_converter encoding_converter, zend_encoding_oddlen encoding_oddlen, zend_encoding_list_checker encoding_list_checker, zend_encoding_name_getter get_internal_encoding TSRMLS_DC); -ZEND_API int zend_multibyte_set_filter(zend_encoding *onetime_encoding TSRMLS_DC); -ZEND_API zend_encoding* zend_multibyte_fetch_encoding(const char *encoding_name); -ZEND_API size_t zend_multibyte_script_encoding_filter(unsigned char **to, size_t -*to_length, const unsigned char *from, size_t from_length TSRMLS_DC); +/* multibyte utility functions */ +ZEND_API int zend_multibyte_set_functions(const zend_multibyte_functions *functions TSRMLS_DC); +ZEND_API const zend_multibyte_functions *zend_multibyte_get_functions(TSRMLS_D); + +ZEND_API const zend_encoding *zend_multibyte_fetch_encoding(const char *name TSRMLS_DC); +ZEND_API const char *zend_multibyte_get_encoding_name(const zend_encoding *encoding); +ZEND_API int zend_multibyte_check_lexer_compatibility(const zend_encoding *encoding); +ZEND_API const zend_encoding *zend_multibyte_encoding_detector(const unsigned char *string, size_t length, const zend_encoding **list, size_t list_size TSRMLS_DC); +ZEND_API size_t zend_multibyte_encoding_converter(unsigned char **to, size_t *to_length, const unsigned char *from, size_t from_length, const zend_encoding *encoding_to, const zend_encoding *encoding_from TSRMLS_DC); +ZEND_API int zend_multibyte_parse_encoding_list(const char *encoding_list, size_t encoding_list_len, const zend_encoding ***return_list, size_t *return_size, int persistent TSRMLS_DC); + +ZEND_API const zend_encoding *zend_multibyte_get_internal_encoding(TSRMLS_D); +ZEND_API const zend_encoding *zend_multibyte_get_script_encoding(TSRMLS_D); +ZEND_API int zend_multibyte_set_script_encoding(const zend_encoding **encoding_list, size_t encoding_list_size TSRMLS_DC); +ZEND_API int zend_multibyte_set_internal_encoding(const zend_encoding *encoding TSRMLS_DC); +ZEND_API int zend_multibyte_set_script_encoding_by_string(const char *new_value, size_t new_value_length TSRMLS_DC); + +ZEND_API size_t zend_multibyte_script_encoding_filter(unsigned char **to, size_t *to_length, const unsigned char *from, size_t from_length TSRMLS_DC); ZEND_API size_t zend_multibyte_internal_encoding_filter(unsigned char **to, size_t *to_length, const unsigned char *from, size_t from_length TSRMLS_DC); -/* in zend_language_scanner.l */ -ZEND_API void zend_multibyte_yyinput_again(zend_encoding_filter old_input_filter, zend_encoding *old_encoding TSRMLS_DC); -ZEND_API int zend_multibyte_yyinput(zend_file_handle *file_handle, char *buf, size_t len TSRMLS_DC); -ZEND_API int zend_multibyte_read_script(unsigned char *buf, size_t n TSRMLS_DC); END_EXTERN_C() #endif /* ZEND_MULTIBYTE_H */ |