Initial commit. Updated bundled oniguruma library (used for multibyte regular expression) to 4.3.1.

author: Seiji Masugata <masugata@php.net> 2006-08-24 17:20:58 +0000
committer: Seiji Masugata <masugata@php.net> 2006-08-24 17:20:58 +0000
commit: 99211d04442b5d92ceff94ccd01e6b57ef23f796 (patch)
tree: 027f88310c759c71833c140765b0f90691b9e04f /ext/mbstring/oniguruma/doc
parent: 74685a184f4b001d608911aa0c7a3cba11eb8fe7 (diff)
download: php-git-99211d04442b5d92ceff94ccd01e6b57ef23f796.tar.gz
6 files changed, 2163 insertions, 0 deletions
diff --git a/ext/mbstring/oniguruma/doc/API b/ext/mbstring/oniguruma/doc/API
new file mode 100644
index 0000000000..7374f65bd4
--- /dev/null
+++ b/ext/mbstring/oniguruma/doc/API
@@ -0,0 +1,586 @@
+Oniguruma API  Version 4.1.0  2006/05/15
+
+#include <oniguruma.h>
+
+
+# int onig_init(void)
+
+  Initialize library.
+
+  You don't have to call it explicitly, because it is called in onig_new().
+
+
+# int onig_error_code_to_str(UChar* err_buf, int err_code, ...)
+
+  Get error message string.
+  If this function is used for onig_new(),
+  don't call this after the pattern argument of onig_new() is freed.
+
+  normal return: error message string length
+
+  arguments
+  1 err_buf:              error message string buffer.
+                          (required size: ONIG_MAX_ERROR_MESSAGE_LEN)
+  2 err_code:             error code returned by other API functions.
+  3 err_info (optional):  error info returned by onig_new().
+
+
+# void onig_set_warn_func(OnigWarnFunc func)
+
+  Set warning function.
+
+  WARNING:
+    '[', '-', ']' in character class without escape.
+    ']' in pattern without escape.
+
+  arguments
+  1 func:     function pointer.    void (*func)(char* warning_message)
+
+
+# void onig_set_verb_warn_func(OnigWarnFunc func)
+
+  Set verbose warning function.
+
+  WARNING:
+    redundant nested repeat operator.
+
+  arguments
+  1 func:     function pointer.    void (*func)(char* warning_message)
+
+
+# int onig_new(regex_t** reg, const UChar* pattern, const UChar* pattern_end,
+            OnigOptionType option, OnigEncoding enc, OnigSyntaxType* syntax,
+            OnigErrorInfo* err_info)
+
+  Create a regex object.
+
+  normal return: ONIG_NORMAL
+
+  arguments
+  1 reg:         return regex object's address.
+  2 pattern:     regex pattern string.
+  3 pattern_end: terminate address of pattern. (pattern + pattern length)
+  4 option:      compile time options.
+
+      ONIG_OPTION_NONE               no option
+      ONIG_OPTION_SINGLELINE         '^' -> '\A', '$' -> '\z', '\Z' -> '\z'
+      ONIG_OPTION_MULTILINE          '.' match with newline
+      ONIG_OPTION_IGNORECASE         ambiguity match on
+      ONIG_OPTION_EXTEND             extended pattern form
+      ONIG_OPTION_FIND_LONGEST       find longest match
+      ONIG_OPTION_FIND_NOT_EMPTY     ignore empty match
+      ONIG_OPTION_NEGATE_SINGLELINE
+            clear ONIG_OPTION_SINGLELINE which is enabled on
+            ONIG_SYNTAX_POSIX_BASIC, ONIG_SYNTAX_POSIX_EXTENDED,
+            ONIG_SYNTAX_PERL, ONIG_SYNTAX_PERL_NG, ONIG_SYNTAX_JAVA
+
+      ONIG_OPTION_DONT_CAPTURE_GROUP only named group captured.
+      ONIG_OPTION_CAPTURE_GROUP      named and no-named group captured.
+
+  5 enc:        character encoding.
+
+      ONIG_ENCODING_ASCII         ASCII
+      ONIG_ENCODING_ISO_8859_1    ISO 8859-1
+      ONIG_ENCODING_ISO_8859_2    ISO 8859-2
+      ONIG_ENCODING_ISO_8859_3    ISO 8859-3
+      ONIG_ENCODING_ISO_8859_4    ISO 8859-4
+      ONIG_ENCODING_ISO_8859_5    ISO 8859-5
+      ONIG_ENCODING_ISO_8859_6    ISO 8859-6
+      ONIG_ENCODING_ISO_8859_7    ISO 8859-7
+      ONIG_ENCODING_ISO_8859_8    ISO 8859-8
+      ONIG_ENCODING_ISO_8859_9    ISO 8859-9
+      ONIG_ENCODING_ISO_8859_10   ISO 8859-10
+      ONIG_ENCODING_ISO_8859_11   ISO 8859-11
+      ONIG_ENCODING_ISO_8859_13   ISO 8859-13
+      ONIG_ENCODING_ISO_8859_14   ISO 8859-14
+      ONIG_ENCODING_ISO_8859_15   ISO 8859-15
+      ONIG_ENCODING_ISO_8859_16   ISO 8859-16
+      ONIG_ENCODING_UTF8          UTF-8
+      ONIG_ENCODING_UTF16_BE      UTF-16BE
+      ONIG_ENCODING_UTF16_LE      UTF-16LE
+      ONIG_ENCODING_UTF32_BE      UTF-32BE
+      ONIG_ENCODING_UTF32_LE      UTF-32LE
+      ONIG_ENCODING_EUC_JP        EUC-JP
+      ONIG_ENCODING_EUC_TW        EUC-TW
+      ONIG_ENCODING_EUC_KR        EUC-KR
+      ONIG_ENCODING_EUC_CN        EUC-CN
+      ONIG_ENCODING_SJIS          Shift_JIS
+      ONIG_ENCODING_KOI8          KOI8
+      ONIG_ENCODING_KOI8_R        KOI8-R
+      ONIG_ENCODING_BIG5          Big5
+      ONIG_ENCODING_GB18030       GB 18030
+
+      or any OnigEncodingType data address defined by user.
+
+  6 syntax:     address of pattern syntax definition.
+
+      ONIG_SYNTAX_ASIS              plain text
+      ONIG_SYNTAX_POSIX_BASIC       POSIX Basic RE
+      ONIG_SYNTAX_POSIX_EXTENDED    POSIX Extended RE
+      ONIG_SYNTAX_EMACS             Emacs
+      ONIG_SYNTAX_GREP              grep
+      ONIG_SYNTAX_GNU_REGEX         GNU regex
+      ONIG_SYNTAX_JAVA              Java (Sun java.util.regex)
+      ONIG_SYNTAX_PERL              Perl
+      ONIG_SYNTAX_PERL_NG           Perl + named group
+      ONIG_SYNTAX_RUBY              Ruby
+      ONIG_SYNTAX_DEFAULT           default (== Ruby)
+                                   onig_set_default_syntax()
+
+      or any OnigSyntaxType data address defined by user.
+
+  7 err_info: address for return optional error info.
+              Use this value as 3rd argument of onig_error_code_to_str().
+
+
+
+# int onig_new_deluxe(regex_t** reg, const UChar* pattern, const UChar* pattern_end,
+                      OnigCompileInfo* ci, OnigErrorInfo* einfo)
+
+  Create a regex object.
+  This function is deluxe version of onig_new().
+
+  normal return: ONIG_NORMAL
+
+  arguments
+  1 reg:         return address of regex object.
+  2 pattern:     regex pattern string.
+  3 pattern_end: terminate address of pattern. (pattern + pattern length)
+  4 ci:          compile time info.
+
+    ci->num_of_elements: number of elements in ci. (current version: 5)
+    ci->pattern_enc:     pattern string character encoding.
+    ci->target_enc:      target string character encoding.
+    ci->syntax:          address of pattern syntax definition.
+    ci->option:          compile time option.
+    ci->ambig_flag:      character matching ambiguity bit flag for 
+                         ONIG_OPTION_IGNORECASE mode.
+
+       ONIGENC_AMBIGUOUS_MATCH_NONE:          exact
+       ONIGENC_AMBIGUOUS_MATCH_ASCII_CASE:    ignore case for ASCII
+       ONIGENC_AMBIGUOUS_MATCH_NONASCII_CASE: ignore case for non-ASCII
+       ONIGENC_AMBIGUOUS_MATCH_COMPOUND:      grapheme cluster as a char
+       ONIGENC_AMBIGUOUS_MATCH_FULL:          all ambiguity on
+       ONIGENC_AMBIGUOUS_MATCH_DEFAULT:       (ASCII | NONASCII)
+                                              onig_set_default_ambig_flag()
+
+  5 einfo:       address for return optional error info.
+                 Use this value as 3rd argument of onig_error_code_to_str().
+
+
+  Different character encoding combination is allowed for
+  the following cases only.
+
+    pattern_enc: ASCII, ISO_8859_1
+    target_enc:  UTF16_BE, UTF16_LE, UTF32_BE, UTF32_LE
+
+    pattern_enc: UTF16_BE/LE
+    target_enc:  UTF16_LE/BE
+
+    pattern_enc: UTF32_BE/LE
+    target_enc:  UTF32_LE/BE
+
+
+# void onig_free(regex_t* reg)
+
+  Free memory used by regex object.
+
+  arguments
+  1 reg: regex object.
+
+
+# int onig_search(regex_t* reg, const UChar* str, const UChar* end, const UChar* start,
+                   const UChar* range, OnigRegion* region, OnigOptionType option)
+
+  Search string and return search result and matching region.
+
+  normal return: match position offset (i.e.  p - str >= 0)
+  not found:     ONIG_MISMATCH (< 0)
+
+  arguments
+  1 reg:    regex object
+  2 str:    target string
+  3 end:    terminate address of target string
+  4 start:  search start address of target string
+  5 range:  search terminate address of target string
+    in forward search  (start <= searched string head < range)
+    in backward search (range <= searched string head <= start)
+  6 region: address for return group match range info (NULL is allowed)
+  7 option: search time option
+
+    ONIG_OPTION_NOTBOL        string head(str) isn't considered as begin of line
+    ONIG_OPTION_NOTEOL        string end (end) isn't considered as end of line
+    ONIG_OPTION_POSIX_REGION  region argument is regmatch_t[] of POSIX API.
+
+
+# int onig_match(regex_t* reg, const UChar* str, const UChar* end, const UChar* at,
+		 OnigRegion* region, OnigOptionType option)
+
+  Match string and return result and matching region.
+
+  normal return: match length  (>= 0)
+  not match:     ONIG_MISMATCH ( < 0)
+
+  arguments
+  1 reg:    regex object
+  2 str:    target string
+  3 end:    terminate address of target string
+  4 at:     match address of target string
+  5 region: address for return group match range info (NULL is allowed)
+  6 option: search time option
+
+    ONIG_OPTION_NOTBOL       string head(str) isn't considered as begin of line
+    ONIG_OPTION_NOTEOL       string end (end) isn't considered as end of line
+    ONIG_OPTION_POSIX_REGION region argument is regmatch_t[] type of POSIX API.
+
+
+# OnigRegion* onig_region_new(void)
+
+  Create a region.
+
+
+# void onig_region_free(OnigRegion* region, int free_self)
+
+  Free memory used by region.
+
+  arguments
+  1 region:    target region
+  2 free_self: [1: free all, 0: free memory used in region but not self]
+
+
+# void onig_region_copy(OnigRegion* to, OnigRegion* from)
+
+  Copy contents of region.
+
+  arguments
+  1 to:   target region
+  2 from: source region
+
+
+# void onig_region_clear(OnigRegion* region)
+
+  Clear contents of region.
+
+  arguments
+  1 region: target region
+
+
+# int onig_region_resize(OnigRegion* region, int n)
+
+  Resize group range area of region.
+
+  normal return: ONIG_NORMAL
+
+  arguments
+  1 region: target region
+  2 n:      new size
+
+
+# int onig_name_to_group_numbers(regex_t* reg, const UChar* name, const UChar* name_end,
+                                  int** num_list)
+
+  Return the group number list of the name.
+  Named subexp is defined by (?<name>....).
+
+  normal return:  number of groups for the name.
+                  (ex. /(?<x>..)(?<x>..)/  ==>  2)
+  name not found: -1
+
+  arguments
+  1 reg:       regex object.
+  2 name:      group name.
+  3 name_end:  terminate address of group name.
+  4 num_list:  return list of group number.
+
+
+# int onig_name_to_backref_number(regex_t* reg, const UChar* name, const UChar* name_end,
+                                  OnigRegion *region)
+
+  Return the group number corresponding to the named backref (\k<name>).
+  If two or more regions for the groups of the name are effective,
+  the greatest group number among them is returned.
+
+  normal return: group number.
+
+  arguments
+  1 reg:      regex object.
+  2 name:     group name.
+  3 name_end: terminate address of group name.
+  4 region:   search/match result region.
+
+
+# int onig_foreach_name(regex_t* reg,
+                        int (*func)(const UChar*, const UChar*, int,int*,regex_t*,void*),
+                        void* arg)
+
+  Iterate function call for all names.
+
+  normal return: 0
+  error:         func's return value.
+
+  arguments
+  1 reg:     regex object.
+  2 func:    callback function.
+             func(name, name_end, <number of groups>, <group number's list>,
+                  reg, arg);
+             if func does not return 0, then iteration is stopped.
+  3 arg:     argument for func.
+
+
+# int onig_number_of_names(regex_t* reg)
+
+  Return the number of names defined in the pattern.
+  Multiple definitions of one name are counted as one.
+
+  arguments
+  1 reg:     regex object.
+
+
+# OnigEncoding    onig_get_encoding(regex_t* reg)
+# OnigOptionType  onig_get_options(regex_t* reg)
+# OnigAmbigType   onig_get_ambig_flag(regex_t* reg)
+# OnigSyntaxType* onig_get_syntax(regex_t* reg)
+
+  Return a value of the regex object.
+
+  arguments
+  1 reg:     regex object.
+
+
+# int onig_number_of_captures(regex_t* reg)
+
+  Return the number of capture groups in the pattern.
+
+  arguments
+  1 reg:     regex object.
+
+
+# int onig_number_of_capture_histories(regex_t* reg)
+
+  Return the number of capture histories defined in the pattern.
+
+  You can't use capture history if ONIG_SYN_OP2_ATMARK_CAPTURE_HISTORY
+  is disabled in the pattern syntax. (It is disabled in the default syntax.)
+
+  arguments
+  1 reg:     regex object.
+
+
+
+# OnigCaptureTreeNode* onig_get_capture_tree(OnigRegion* region)
+
+  Return the root node of capture history data tree.
+
+  This value is undefined if matching has failed.
+
+  arguments
+  1 region: matching result.
+
+
+# int onig_capture_tree_traverse(OnigRegion* region, int at,
+                  int(*func)(int,int,int,int,int,void*), void* arg)
+
+  Traverse the capture history data tree and invoke the callback.
+
+  normal return: 0
+  error:         callback func's return value.
+
+  arguments
+  1 region:  match region data.
+  2 at:      callback position.
+
+    ONIG_TRAVERSE_CALLBACK_AT_FIRST: callback first, then traverse children.
+    ONIG_TRAVERSE_CALLBACK_AT_LAST:  traverse children first, then callback.
+    ONIG_TRAVERSE_CALLBACK_AT_BOTH:  callback first, then traverse children,
+                                     and at last callback again.
+
+  3 func:    callback function.
+             if func does not return 0, then traverse is stopped.
+
+             int func(int group, int beg, int end, int level, int at,
+                      void* arg)
+
+               group: group number
+               beg:   capture start position
+               end:   capture end position
+               level: nest level (from 0)
+               at:    callback position
+                      ONIG_TRAVERSE_CALLBACK_AT_FIRST
+                      ONIG_TRAVERSE_CALLBACK_AT_LAST
+               arg:   optional callback argument
+
+  4 arg:     optional callback argument.
+
+
+# int onig_noname_group_capture_is_active(regex_t* reg)
+
+  Return noname group capture activity.
+
+  active:   1
+  inactive: 0
+
+  arguments
+  1 reg:     regex object.
+
+  if option ONIG_OPTION_DONT_CAPTURE_GROUP == ON
+    --> inactive
+
+  if the regex pattern has a named group
+     and syntax ONIG_SYN_CAPTURE_ONLY_NAMED_GROUP == ON
+     and option ONIG_OPTION_CAPTURE_GROUP == OFF
+    --> inactive
+
+  else --> active
+
+
+# UChar* onigenc_get_prev_char_head(OnigEncoding enc, const UChar* start, const UChar* s)
+
+  Return previous character head address.
+
+  arguments
+  1 enc:   character encoding
+  2 start: string address
+  3 s:     target address of string
+
+
+# UChar* onigenc_get_left_adjust_char_head(OnigEncoding enc,
+                                           const UChar* start, const UChar* s)
+
+  Return left-adjusted head address of a character.
+
+  arguments
+  1 enc:   character encoding
+  2 start: string address
+  3 s:     target address of string
+
+
+# UChar* onigenc_get_right_adjust_char_head(OnigEncoding enc,
+                                            const UChar* start, const UChar* s)
+
+  Return right-adjusted head address of a character.
+
+  arguments
+  1 enc:   character encoding
+  2 start: string address
+  3 s:     target address of string
+
+
+# int onigenc_strlen(OnigEncoding enc, const UChar* s, const UChar* end)
+# int onigenc_strlen_null(OnigEncoding enc, const UChar* s)
+
+  Return number of characters in the string.
+
+
+# int onigenc_str_bytelen_null(OnigEncoding enc, const UChar* s)
+
+  Return number of bytes in the string.
+
+
+# int onig_set_default_syntax(OnigSyntaxType* syntax)
+
+  Set default syntax.
+
+  arguments
+  1 syntax: address of pattern syntax definition.
+
+
+# void onig_copy_syntax(OnigSyntaxType* to, OnigSyntaxType* from)
+
+  Copy syntax.
+
+  arguments
+  1 to:   destination address.
+  2 from: source address.
+
+
+# unsigned int onig_get_syntax_op(OnigSyntaxType* syntax)
+# unsigned int onig_get_syntax_op2(OnigSyntaxType* syntax)
+# unsigned int onig_get_syntax_behavior(OnigSyntaxType* syntax)
+# OnigOptionType onig_get_syntax_options(OnigSyntaxType* syntax)
+
+# void onig_set_syntax_op(OnigSyntaxType* syntax, unsigned int op)
+# void onig_set_syntax_op2(OnigSyntaxType* syntax, unsigned int op2)
+# void onig_set_syntax_behavior(OnigSyntaxType* syntax, unsigned int behavior)
+# void onig_set_syntax_options(OnigSyntaxType* syntax, OnigOptionType options)
+
+  Get/Set elements of the syntax.
+
+  arguments
+  1 syntax:  syntax
+  2 op, op2, behavior, options: value of element.
+
+
+# void onig_copy_encoding(OnigEncoding to, OnigEncoding from)
+
+  Copy encoding.
+
+  arguments
+  1 to:   destination address.
+  2 from: source address.
+
+
+# int onig_set_meta_char(OnigEncoding enc, unsigned int what,
+                         OnigCodePoint code)
+
+  Set a variable meta character to the code point value.
+  Except for the escape character, this meta character specification
+  has no effect unless ONIG_SYN_OP_VARIABLE_META_CHARACTERS is enabled
+  in the syntax. (It is not enabled in the built-in syntaxes.)
+
+  normal return: ONIG_NORMAL
+
+  arguments
+  1 enc:  target encoding
+  2 what: specifies which meta character it is.
+
+          ONIG_META_CHAR_ESCAPE
+          ONIG_META_CHAR_ANYCHAR
+          ONIG_META_CHAR_ANYTIME
+          ONIG_META_CHAR_ZERO_OR_ONE_TIME
+          ONIG_META_CHAR_ONE_OR_MORE_TIME
+          ONIG_META_CHAR_ANYCHAR_ANYTIME
+
+  3 code: meta character or ONIG_INEFFECTIVE_META_CHAR.
+
+
+# OnigAmbigType onig_get_default_ambig_flag()
+
+  Get default ambig flag.
+
+
+# int onig_set_default_ambig_flag(OnigAmbigType ambig_flag)
+
+  Set default ambig flag.
+
+  arguments
+  1 ambig_flag: ambiguity flag
+
+
+# unsigned int onig_get_match_stack_limit_size(void)
+
+  Return the maximum match stack size.
+  (default: 0 == unlimited)
+
+
+# int onig_set_match_stack_limit_size(unsigned int size)
+
+  Set the maximum match stack size.
+  (size = 0: unlimited)
+
+  normal return: ONIG_NORMAL
+
+
+# int onig_end(void)
+
+  The use of this library is finished.
+
+  normal return: ONIG_NORMAL
+
+  Regex objects created before the onig_end() call
+  must not be used afterwards.
+
+
+# const char* onig_version(void)
+
+  Return version string.  (ex. "2.2.8")
+
+// END
diff --git a/ext/mbstring/oniguruma/doc/API.ja b/ext/mbstring/oniguruma/doc/API.ja
new file mode 100644
index 0000000000..2682da4808
--- /dev/null
+++ b/ext/mbstring/oniguruma/doc/API.ja
@@ -0,0 +1,593 @@
+���֥��󥿡��ե����� Version 4.1.0   2006/05/15
+
+#include <oniguruma.h>
+
+
+# int onig_init(void)
+
+  �饤�֥��ν����
+
+  onig_new()����ǸƤӽФ����Τǡ����δؿ�������Ū�˸ƤӽФ��ʤ��Ƥ�褤��
+
+
+# int onig_error_code_to_str(UChar* err_buf, int err_code, ...)
+
+  ���顼��å�������������롣
+
+  ���δؿ���onig_new()�η�̤��Ф��ƸƤӽФ����ˤϡ�onig_new()��pattern������
+  �����������������˸ƤӽФ��ʤ���Фʤ�ʤ���
+
+  ���ｪλ�����: ���顼��å�����ʸ����ΥХ���Ĺ
+
+  ����
+  1 err_buf:              ���顼��å��������Ǽ�����ΰ�
+                          (ɬ�פʥ�����: ONIG_MAX_ERROR_MESSAGE_LEN)
+  2 err_code:             ���顼������
+  3 err_info (optional):  onig_new()��err_info
+
+
+# void onig_set_warn_func(OnigWarnFunc func)
+
+  �ٹ����δؿ��򥻥åȤ��롣
+
+  �ٹ�:
+    '[', '-', ']' in character class without escape.
+    ']' in pattern without escape.
+
+  ����
+  1 func:    �ٹ�ؿ�    void (*func)(char* warning_message)
+
+
+# void onig_set_verb_warn_func(OnigWarnFunc func)
+
+  �ܺٷٹ����δؿ��򥻥åȤ��롣
+
+  �ܺٷٹ�:
+    redundant nested repeat operator.
+
+  ����
+  1 func:    �ܺٷٹ�ؿ�    void (*func)(char* warning_message)
+
+
+# int onig_new(regex_t** reg, const UChar* pattern, const UChar* pattern_end,
+            OnigOptionType option, OnigEncoding enc, OnigSyntaxType* syntax,
+            OnigErrorInfo* err_info)
+
+  ����ɽ�����֥�������(regex)��������롣
+
+  ���ｪλ�����: ONIG_NORMAL
+
+  ����
+  1 reg:         �������줿����ɽ�����֥������Ȥ��֤����ɥ쥹
+  2 pattern:     ����ɽ���ѥ�����ʸ����
+  3 pattern_end: ����ɽ���ѥ�����ʸ����ν�ü���ɥ쥹(pattern + pattern length)
+  4 option:      ����ɽ������ѥ�������ץ����
+
+      ONIG_OPTION_NONE               ���ץ����ʤ�
+      ONIG_OPTION_SINGLELINE         '^' -> '\A', '$' -> '\z', '\Z' -> '\z'
+      ONIG_OPTION_MULTILINE          '.'�����Ԥ˥ޥå�����
+      ONIG_OPTION_IGNORECASE         ۣ��ޥå� ����
+      ONIG_OPTION_EXTEND             �ѥ������ĥ����
+      ONIG_OPTION_FIND_LONGEST       ��Ĺ�ޥå�
+      ONIG_OPTION_FIND_NOT_EMPTY     ���ޥå���̵��
+      ONIG_OPTION_NEGATE_SINGLELINE
+            ONIG_SYNTAX_POSIX_BASIC, ONIG_SYNTAX_POSIX_EXTENDED,
+            ONIG_SYNTAX_PERL, ONIG_SYNTAX_PERL_NG, ONIG_SYNTAX_JAVA��
+            �ǥե���Ȥ�ͭ����ONIG_OPTION_SINGLELINE�򥯥ꥢ���롣
+
+      ONIG_OPTION_DONT_CAPTURE_GROUP ̾���դ���ͼ�����Τ����
+      ONIG_OPTION_CAPTURE_GROUP      ̾��̵����ͼ���������
+
+  5 enc:        ʸ�����󥳡��ǥ���
+
+      ONIG_ENCODING_ASCII         ASCII
+      ONIG_ENCODING_ISO_8859_1    ISO 8859-1
+      ONIG_ENCODING_ISO_8859_2    ISO 8859-2
+      ONIG_ENCODING_ISO_8859_3    ISO 8859-3
+      ONIG_ENCODING_ISO_8859_4    ISO 8859-4
+      ONIG_ENCODING_ISO_8859_5    ISO 8859-5
+      ONIG_ENCODING_ISO_8859_6    ISO 8859-6
+      ONIG_ENCODING_ISO_8859_7    ISO 8859-7
+      ONIG_ENCODING_ISO_8859_8    ISO 8859-8
+      ONIG_ENCODING_ISO_8859_9    ISO 8859-9
+      ONIG_ENCODING_ISO_8859_10   ISO 8859-10
+      ONIG_ENCODING_ISO_8859_11   ISO 8859-11
+      ONIG_ENCODING_ISO_8859_13   ISO 8859-13
+      ONIG_ENCODING_ISO_8859_14   ISO 8859-14
+      ONIG_ENCODING_ISO_8859_15   ISO 8859-15
+      ONIG_ENCODING_ISO_8859_16   ISO 8859-16
+      ONIG_ENCODING_UTF8          UTF-8
+      ONIG_ENCODING_UTF16_BE      UTF-16BE
+      ONIG_ENCODING_UTF16_LE      UTF-16LE
+      ONIG_ENCODING_UTF32_BE      UTF-32BE
+      ONIG_ENCODING_UTF32_LE      UTF-32LE
+      ONIG_ENCODING_EUC_JP        EUC-JP
+      ONIG_ENCODING_EUC_TW        EUC-TW
+      ONIG_ENCODING_EUC_KR        EUC-KR
+      ONIG_ENCODING_EUC_CN        EUC-CN
+      ONIG_ENCODING_SJIS          Shift_JIS
+      ONIG_ENCODING_KOI8          KOI8
+      ONIG_ENCODING_KOI8_R        KOI8-R
+      ONIG_ENCODING_BIG5          Big5
+      ONIG_ENCODING_GB18030       GB 18030
+
+      �ޤ��ϡ��桼�����������OnigEncodingType�ǡ����Υ��ɥ쥹
+
+  6 syntax:     ����ɽ���ѥ�����ʸˡ���
+
+      ONIG_SYNTAX_ASIS              plain text
+      ONIG_SYNTAX_POSIX_BASIC       POSIX Basic RE
+      ONIG_SYNTAX_POSIX_EXTENDED    POSIX Extended RE
+      ONIG_SYNTAX_EMACS             Emacs
+      ONIG_SYNTAX_GREP              grep
+      ONIG_SYNTAX_GNU_REGEX         GNU regex
+      ONIG_SYNTAX_JAVA              Java (Sun java.util.regex)
+      ONIG_SYNTAX_PERL              Perl
+      ONIG_SYNTAX_PERL_NG           Perl + ̾���դ���ͼ�����
+      ONIG_SYNTAX_RUBY              Ruby
+      ONIG_SYNTAX_DEFAULT           default (== Ruby)
+                                    onig_set_default_syntax()
+
+      �ޤ��ϡ��桼�����������OnigSyntaxType�ǡ����Υ��ɥ쥹
+
+  7 err_info: ���顼������֤�����Υ��ɥ쥹
+              onig_error_code_to_str()�λ����ܤΰ����Ȥ��ƻ��Ѥ���
+
+
+# int onig_new_deluxe(regex_t** reg, const UChar* pattern, const UChar* pattern_end,
+                      OnigCompileInfo* ci, OnigErrorInfo* einfo)
+
+  ����ɽ�����֥�������(regex)��������롣
+  ���δؿ��ϡ�onig_new()�Υǥ�å����ǡ�
+
+  ���ｪλ�����: ONIG_NORMAL
+
+  ����
+  1 reg:         �������줿����ɽ�����֥������Ȥ��֤����ɥ쥹
+  2 pattern:     ����ɽ���ѥ�����ʸ����
+  3 pattern_end: ����ɽ���ѥ�����ʸ����ν�ü���ɥ쥹(pattern + pattern length)
+  4 ci:          ����ѥ������
+
+    ci->num_of_elements: ci�����ǿ� (���ߤ��ǤǤ�: 5)
+    ci->pattern_enc:     �ѥ�����ʸ�����ʸ�����󥳡��ǥ���
+    ci->target_enc:      �о�ʸ�����ʸ�����󥳡��ǥ���
+    ci->syntax:          ����ɽ���ѥ�����ʸˡ���
+    ci->option:          ����ɽ������ѥ�������ץ����
+    ci->ambig_flag:      ONIG_OPTION_IGNORECASE�⡼�ɤǤ�
+                         ʸ��ۣ��ޥå�����ӥåȥե饰
+
+       ONIGENC_AMBIGUOUS_MATCH_NONE:          ۣ��̵��
+       ONIGENC_AMBIGUOUS_MATCH_ASCII_CASE:    ASCII����ʸ����ʸ��
+       ONIGENC_AMBIGUOUS_MATCH_NONASCII_CASE: ASCII�ʳ�����ʸ����ʸ��
+       ONIGENC_AMBIGUOUS_MATCH_COMPOUND:      ����ʸ��
+       ONIGENC_AMBIGUOUS_MATCH_FULL:          ���Ƥ�ۣ��ե饰ͭ��
+       ONIGENC_AMBIGUOUS_MATCH_DEFAULT:       (ASCII | NONASCII)
+                                              onig_set_default_ambig_flag()
+
+  5 err_info:    ���顼������֤�����Υ��ɥ쥹
+                 onig_error_code_to_str()�λ����ܤΰ����Ȥ��ƻ��Ѥ���
+
+
+  �ۤʤ�ʸ�����󥳡��ǥ��󥰤��Ȥ߹�碌�ϡ��ʲ��ξ��ˤΤߵ�����롣
+
+    pattern_enc: ASCII, ISO_8859_1
+    target_enc:  UTF16_BE, UTF16_LE, UTF32_BE, UTF32_LE
+
+    pattern_enc: UTF16_BE/LE
+    target_enc:  UTF16_LE/BE
+
+    pattern_enc: UTF32_BE/LE
+    target_enc:  UTF32_LE/BE
+
+
+# void onig_free(regex_t* reg)
+
+  ����ɽ�����֥������ȤΥ����������롣
+
+  ����
+  1 reg: ����ɽ�����֥�������
+
+
+
+# int onig_search(regex_t* reg, const UChar* str, const UChar* end, const UChar* start,
+                   const UChar* range, OnigRegion* region, OnigOptionType option)
+
+  ����ɽ����ʸ����򸡺�����������̤ȥޥå��ΰ���֤���
+
+  ���ｪλ�����: �ޥå����� (p - str >= 0)
+  ��������:       ONIG_MISMATCH (< 0)
+
+  ����
+  1 reg:    ����ɽ�����֥�������
+  2 str:    �����о�ʸ����
+  3 end:    �����о�ʸ����ν�ü���ɥ쥹
+  4 start:  �����о�ʸ����θ�����Ƭ���ֳ��ϥ��ɥ쥹
+  5 range:  �����о�ʸ����θ�����Ƭ���ֽ�ü���ɥ쥹
+    ����õ��  (start <= õ�������ʸ�������Ƭ < range)
+    ����õ��  (range <= õ�������ʸ�������Ƭ <= start)
+  6 region: �ޥå��ΰ����(region)  (NULL��������)
+  7 option: ���������ץ����
+
+    ONIG_OPTION_NOTBOL        ʸ�������Ƭ(str)���Ƭ�ȴ������ʤ�
+    ONIG_OPTION_NOTEOL        ʸ����ν�ü(end)������ȴ������ʤ�
+    ONIG_OPTION_POSIX_REGION  region������POSIX API��regmatch_t[]�ˤ���
+
+
+# int onig_match(regex_t* reg, const UChar* str, const UChar* end, const UChar* at,
+		 OnigRegion* region, OnigOptionType option)
+
+  ʸ����λ�����֤ǥޥå��󥰤�Ԥ�����̤ȥޥå��ΰ���֤���
+
+  ���ｪλ�����: �ޥå������Х���Ĺ (>= 0)
+  not match:      ONIG_MISMATCH      ( < 0)
+
+  ����
+  1 reg:    ����ɽ�����֥�������
+  2 str:    �����о�ʸ����
+  3 end:    �����о�ʸ����ν�ü���ɥ쥹
+  4 at:     �����о�ʸ����θ������ɥ쥹
+  5 region: �ޥå��ΰ����(region)  (NULL��������)
+  6 option: ���������ץ����
+
+    ONIG_OPTION_NOTBOL        ʸ�������Ƭ(str)���Ƭ�ȴ������ʤ�
+    ONIG_OPTION_NOTEOL        ʸ����ν�ü(end)������ȴ������ʤ�
+    ONIG_OPTION_POSIX_REGION  region������POSIX API��regmatch_t[]�ˤ���
+
+
+# OnigRegion* onig_region_new(void)
+
+  �ޥå��ΰ����(region)��������롣
+
+
+# void onig_region_free(OnigRegion* region, int free_self)
+
+  �ޥå��ΰ����(region)�ǻ��Ѥ���Ƥ�������������롣
+
+  ����
+  1 region:    �ޥå��ΰ���󥪥֥�������
+  2 free_self:  [1: region���Ȥ�ޤ�����Ʋ���, 0: region���Ȥϲ������ʤ�]
+
+
+# void onig_region_copy(OnigRegion* to, OnigRegion* from)
+
+  �ޥå��ΰ����(region)��ʣ�����롣
+
+  ����
+  1 to:   �о��ΰ�
+  2 from: ���ΰ�
+
+
+# void onig_region_clear(OnigRegion* region)
+
+  �ޥå��ΰ����(region)����̣�򥯥ꥢ���롣
+
+  ����
+  1 region: �о��ΰ�
+
+
+# int onig_region_resize(OnigRegion* region, int n)
+
+  �ޥå��ΰ����(region)����ͼ�����(���롼��)�����ѹ����롣
+
+  ���ｪλ�����: ONIG_NORMAL
+
+  ����
+  1 region: �о��ΰ�
+  2 n:      ������������
+
+
+# int onig_name_to_group_numbers(regex_t* reg, const UChar* name, const UChar* name_end,
+                                  int** num_list)
+
+  ���ꤷ��̾�����Ф���̾���դ���ͼ�����(���롼��)��
+  ���롼���ֹ�ꥹ�Ȥ��֤���
+  ̾���դ���ͼ�����ϡ�(?<name>....)�ˤ�ä�����Ǥ��롣
+
+  ���ｪλ�����:  ���ꤵ�줿̾�����Ф��륰�롼�׿�
+                   (�� /(?<x>..)(?<x>..)/  ==>  2)
+  ̾�����Ф��륰�롼�פ�¸�ߤ��ʤ�: -1
+
+  ����
+  1 reg:       ����ɽ�����֥�������
+  2 name:      ��ͼ�����(���롼��)̾
+  3 name_end:  ��ͼ�����(���롼��)̾�ν�ü���ɥ쥹
+  4 num_list:  �ֹ�ꥹ�Ȥ��֤����ɥ쥹
+
+
+# int onig_name_to_backref_number(regex_t* reg, const UChar* name, const UChar* name_end,
+                                  OnigRegion *region)
+
+  ���ꤵ�줿̾���θ�������(\k<name>)���Ф�����ͼ�����(���롼��)���ֹ���֤���
+  ̾�����Ф��ơ�ʣ���Υޥå��ΰ褬ͭ���Ǥ���С�������κ�����ֹ���֤���
+  ̾�����Ф�����ͼ����礬��Ĥ����ʤ��Ȥ��ˤϡ��б�����ޥå��ΰ褬ͭ����
+  �ɤ����˴ط��ʤ��������ֹ���֤���(���äơ�region�ˤ�NULL���Ϥ��Ƥ�褤��)
+
+  ���ｪλ�����: �ֹ�
+
+  ����
+  1 reg:       ����ɽ�����֥�������
+  2 name:      ��ͼ�����(���롼��)̾
+  3 name_end:  ��ͼ�����(���롼��)̾�ν�ü���ɥ쥹
+  4 region:    search/match��̤Υޥå��ΰ�
+
+
+# int onig_foreach_name(regex_t* reg,
+                        int (*func)(const UChar*, const UChar*, int,int*,regex_t*,void*),
+                        void* arg)
+
+  ���Ƥ�̾�����Ф��ƥ�����Хå��ؿ��ƤӽФ���¹Ԥ��롣
+
+  ���ｪλ�����: 0
+  ���顼:         ������Хå��ؿ��������
+
+  ����
+  1 reg:     ����ɽ�����֥�������
+  2 func:    ������Хå��ؿ�
+             func(name, name_end, <number of groups>, <group number's list>,
+                  reg, arg);
+
+             func��0�ʳ����ͤ��֤��ȡ�����ʹߤΥ�����Хå��ϹԤʤ鷺��
+             ��λ���롣
+
+  3 arg:     func���Ф����ɲð���
+
+
+# int onig_number_of_names(regex_t* reg)
+
+  �ѥ��������������줿̾���ο����֤���
+  ��Ĥ�̾����¿������ϰ�Ĥȴ�������
+
+  ����
+  1 reg:    ����ɽ�����֥�������
+
+
+# OnigEncoding    onig_get_encoding(regex_t* reg)
+# OnigOptionType  onig_get_options(regex_t* reg)
+# OnigAmbigType   onig_get_ambig_flag(regex_t* reg)
+# OnigSyntaxType* onig_get_syntax(regex_t* reg)
+
+  ����ɽ�����֥������Ȥ��Ф��ơ��б������ͤ��֤���
+
+  ����
+  1 reg:    ����ɽ�����֥�������
+
+
+# int onig_number_of_captures(regex_t* reg)
+
+  �ѥ��������������줿��ͥ��롼�פο����֤���
+
+  ����
+  1 reg:    ����ɽ�����֥�������
+
+
+# int onig_number_of_capture_histories(regex_t* reg)
+
+  �ѥ��������������줿�������(?@...)�ο����֤���
+
+  ���Ѥ���ʸˡ���������ǽ��ͭ��(ONIG_SYN_OP2_ATMARK_CAPTURE_HISTORY)
+  �Ǥʤ���С��������ǽ�ϻ��ѤǤ��ʤ���
+
+  ����
+  1 reg:    ����ɽ�����֥�������
+
+
+# OnigCaptureTreeNode* onig_get_capture_tree(OnigRegion* region)
+
+  �������ǡ����Υ롼�ȥΡ��ɤ��֤���
+
+  �ޥå������Ԥ��Ƥ�����ˤϡ������ͤ�����Ǥ��롣
+
+  ����
+  1 region: �ޥå��ΰ�
+
+
+# int onig_capture_tree_traverse(OnigRegion* region, int at,
+                  int(*func)(int,int,int,int,int,void*), void* arg)
+
+  �������ǡ����ڤ��󤷤ƥ�����Хå����롣
+
+  ���ｪλ�����: 0
+  ���顼:         ������Хå��ؿ��������
+
+  ����
+  1 region:  �ޥå��ΰ�
+  2 at:      ������Хå���Ԥʤ������ߥ�
+
+    ONIG_TRAVERSE_CALLBACK_AT_FIRST:
+        �ǽ�˥�����Хå����ơ��ҥΡ��ɤ���
+    ONIG_TRAVERSE_CALLBACK_AT_LAST:
+        �ҥΡ��ɤ��󤷤ơ�������Хå�
+    ONIG_TRAVERSE_CALLBACK_AT_BOTH:
+        �ǽ�˥�����Хå����ơ��ҥΡ��ɤ��󡢺Ǹ�ˤ⤦���٥�����Хå�
+
+  3 func:    ������Хå��ؿ�
+             func��0�ʳ����ͤ��֤��ȡ�����ʹߤν��ϹԤʤ鷺��
+             ��λ���롣
+
+             int func(int group, int beg, int end, int level, int at,
+                      void* arg)
+               group: ���롼���ֹ�
+               beg:   �ޥå����ϰ���
+               end:   マッチ終了位置
+               level: �ͥ��ȥ�٥� (0����)
+               at:    ������Хå����ƤӽФ��줿�����ߥ�
+                      ONIG_TRAVERSE_CALLBACK_AT_FIRST
+                      ONIG_TRAVERSE_CALLBACK_AT_LAST
+               arg:   �ɲð���
+
+  4 arg;     func���Ф����ɲð���
+
+
+# int onig_noname_group_capture_is_active(regex_t* reg)
+
+  ̾���ʤ����������͵�ǽ��ͭ�����ɤ������֤���
+
+  ͭ��: 1
+  ̵��: 0
+
+  ����
+  1 reg:    ����ɽ�����֥�������
+
+
+  ���ץ�����ONIG_OPTION_DONT_CAPTURE_GROUP��ON --> ̵��
+
+  �ѥ�����̾���Ĥ����������Ѥ��Ƥ���
+  AND ����ʸˡ�ǡ�ONIG_SYN_CAPTURE_ONLY_NAMED_GROUP��ON
+  AND ���ץ�����ONIG_OPTION_CAPTURE_GROUP��OFF
+  --> ̵��
+
+  �嵭�ʳ��ξ�� --> ͭ��
+
+
+# UChar* onigenc_get_prev_char_head(OnigEncoding enc, const UChar* start, const UChar* s)
+
+  ʸ�����ʬ����ʸ������֤��֤���
+
+  ����
+  1 enc:   ʸ�����󥳡��ǥ���
+  2 start: ʸ�������Ƭ���ɥ쥹
+  3 s:     ʸ������ΰ���
+
+
+# UChar* onigenc_get_left_adjust_char_head(OnigEncoding enc,
+                                           const UChar* start, const UChar* s)
+
+  ʸ������Ƭ�Х��Ȱ��֤ˤʤ�褦�˺�¦��Ĵ���������ɥ쥹���֤���
+
+  ����
+  1 enc:   ʸ�����󥳡��ǥ���
+  2 start: ʸ�������Ƭ���ɥ쥹
+  3 s:     ʸ������ΰ���
+
+
+# UChar* onigenc_get_right_adjust_char_head(OnigEncoding enc,
+                                            const UChar* start, const UChar* s)
+
+  ʸ������Ƭ�Х��Ȱ��֤ˤʤ�褦�˱�¦��Ĵ���������ɥ쥹���֤���
+
+  ����
+  1 enc:   ʸ�����󥳡��ǥ���
+  2 start: ʸ�������Ƭ���ɥ쥹
+  3 s:     ʸ������ΰ���
+
+
+# int onigenc_strlen(OnigEncoding enc, const UChar* s, const UChar* end)
+# int onigenc_strlen_null(OnigEncoding enc, const UChar* s)
+
+  ʸ�����ʸ�������֤���
+
+
+# int onigenc_str_bytelen_null(OnigEncoding enc, const UChar* s)
+
+  ʸ����ΥХ��ȿ����֤���
+
+
+# int onig_set_default_syntax(OnigSyntaxType* syntax)
+
+  �ǥե���Ȥ�����ɽ���ѥ�����ʸˡ�򥻥åȤ��롣
+
+  ����
+  1 syntax: ����ɽ���ѥ�����ʸˡ
+
+
+# void onig_copy_syntax(OnigSyntaxType* to, OnigSyntaxType* from)
+
+  ����ɽ���ѥ�����ʸˡ�򥳥ԡ����롣
+
+  ����
+  1 to:   �о�
+  2 from: ��
+
+
+# unsigned int onig_get_syntax_op(OnigSyntaxType* syntax)
+# unsigned int onig_get_syntax_op2(OnigSyntaxType* syntax)
+# unsigned int onig_get_syntax_behavior(OnigSyntaxType* syntax)
+# OnigOptionType onig_get_syntax_options(OnigSyntaxType* syntax)
+
+# void onig_set_syntax_op(OnigSyntaxType* syntax, unsigned int op)
+# void onig_set_syntax_op2(OnigSyntaxType* syntax, unsigned int op2)
+# void onig_set_syntax_behavior(OnigSyntaxType* syntax, unsigned int behavior)
+# void onig_set_syntax_options(OnigSyntaxType* syntax, OnigOptionType options)
+
+  ����ɽ���ѥ�����ʸˡ�����Ǥ򻲾�/�������롣
+
+  ����
+  1 syntax:                     ����ɽ���ѥ�����ʸˡ
+  2 op, op2, behavior, options: ���Ǥ���
+
+
+# void onig_copy_encoding(OnigEncoding to, OnigEncoding from)
+
+  ʸ�����󥳡��ǥ��󥰤򥳥ԡ����롣
+
+  ����
+  1 to:   �о�
+  2 from: ��
+
+
+# int onig_set_meta_char(OnigEncoding enc, unsigned int what,
+                         OnigCodePoint code)
+
+  �᥿ʸ������ꤷ�������ɥݥ�����ͤ˥��åȤ��롣
+  ONIG_SYN_OP_VARIABLE_META_CHARACTERS������ɽ���ѥ�����ʸˡ��ͭ����
+  �ʤäƤ��ʤ����ˤϡ�����������ʸ��������ơ������ǻ��ꤷ���᥿ʸ����
+  ��ǽ���ʤ���(�ȹ��ߤ�ʸˡ�Ǥ�ͭ���ˤ��Ƥ��ʤ���)
+
+  ���ｪλ�����: ONIG_NORMAL
+
+  ����
+  1 enc:  �о�ʸ�����󥳡��ǥ���
+  2 what: �᥿ʸ����ǽ�λ���
+
+          ONIG_META_CHAR_ESCAPE
+          ONIG_META_CHAR_ANYCHAR
+          ONIG_META_CHAR_ANYTIME
+          ONIG_META_CHAR_ZERO_OR_ONE_TIME
+          ONIG_META_CHAR_ONE_OR_MORE_TIME
+          ONIG_META_CHAR_ANYCHAR_ANYTIME
+
+  3 code: �᥿ʸ���Υ����ɥݥ���� �ޤ��� ONIG_INEFFECTIVE_META_CHAR.
+
+
+# OnigAmbigType onig_get_default_ambig_flag()
+
+  �ǥե���Ȥ�ۣ��ޥå��ե饰��������롣
+
+
+# int onig_set_default_ambig_flag(OnigAmbigType ambig_flag)
+
+  �ǥե���Ȥ�ۣ��ޥå��ե饰�򥻥åȤ��롣
+
+  ����
+  1 ambig_flag: ۣ��ޥå��ե饰
+
+
+# unsigned int onig_get_match_stack_limit_size(void)
+
+  �ޥå������å��������κ����ͤ��֤���
+  (�ǥե����: 0 == ̵����)
+
+
+# int onig_set_match_stack_limit_size(unsigned int size)
+
+  �ޥå������å��������κ����ͤ���ꤹ�롣
+  (size = 0: ̵����)
+
+  ���ｪλ�����: ONIG_NORMAL
+
+
+# int onig_end(void)
+
+  �饤�֥��λ��Ѥ�λ���롣
+
+  ���ｪλ�����: ONIG_NORMAL
+
+  onig_init()����ٸƤӽФ��Ƥ⡢�����˺�����������ɽ�����֥�������
+  ����Ѥ��뤳�ȤϤǤ��ʤ���
+
+
+# const char* onig_version(void)
+
+  �С������ʸ������֤���(�� "2.2.8")
+
+// END
diff --git a/ext/mbstring/oniguruma/doc/FAQ b/ext/mbstring/oniguruma/doc/FAQ
new file mode 100644
index 0000000000..1621a359eb
--- /dev/null
+++ b/ext/mbstring/oniguruma/doc/FAQ
@@ -0,0 +1,33 @@
+FAQ    2006/05/15
+
+1. Longest match
+
+   You can execute longest match by using ONIG_OPTION_FIND_LONGEST option
+   in onig_new().
+
+
+2. Thread safe
+
+   To make the library thread safe, either (A) or (B) must be done.
+
+   (A) Oniguruma Layer
+
+       Define the macro below at NOT_RUBY case in oniguruma/regint.h.
+
+       USE_MULTI_THREAD_SYSTEM
+       THREAD_ATOMIC_START
+       THREAD_ATOMIC_END
+       THREAD_PASS
+
+   (B) Application Layer
+
+       Multiple threads must not simultaneously create new regexp
+       objects, re-compile objects, or free objects, even if the
+       objects involved are different.
+
+
+3. Mailing list
+
+   There is no mailing list about Oniguruma.
+
+// END
diff --git a/ext/mbstring/oniguruma/doc/FAQ.ja b/ext/mbstring/oniguruma/doc/FAQ.ja
new file mode 100644
index 0000000000..5f61b09554
--- /dev/null
+++ b/ext/mbstring/oniguruma/doc/FAQ.ja
@@ -0,0 +1,115 @@
+FAQ    2006/05/15
+
+1. 最長マッチ
+
+   onig_new()の中で、ONIG_OPTION_FIND_LONGESTオプション
+   を使用すれば最長マッチになる。
+
+
+2. スレッドセーフ
+
+   ����åɥ����դˤ���ˤϡ��ʲ���(A)��(B)�Τɤ��餫��Ԥʤ���
+   �褤��
+
+   (A) Oniguruma Layer
+
+       oniguruma/regint.h�����NOT_RUBY����ʬ�ΰʲ��Υޥ�����������롣
+
+       USE_MULTI_THREAD_SYSTEM
+       THREAD_ATOMIC_START
+       THREAD_ATOMIC_END
+       THREAD_PASS
+
+   (B) Application Layer
+
+       Ʊ����ʣ���Υ���åɤ�������ɽ�����֥������Ȥ�������롢
+       �ޤ��ϲ������롢���Ȥ�ԤʤäƤϤʤ�ʤ���
+       �����Υ��֥������Ȥ������̤Τ�ΤǤ��äƤ⡣
+
+   �⤦�����ܤ��������ϡ����Υɥ�����Ȥ����
+   "����åɥ����դ˴ؤ�����"�˽񤤤Ƥ�������
+
+
+3. メーリングリスト
+
+   鬼車に関するメーリングリストは存在しない。
+
+//END
+
+
+
+����åɥ����դ˴ؤ�����
+
+����åɥ����դˤ���ˤϡ����̤Υ��ץꥱ����������ǹԤ�����
+Oniguruma�饤�֥�����ǹԤ������ɤ��餫�����֤��Ȥ��Ǥ��ޤ���
+(Oniguruma����Ѥ���¦���н褹�뤫��Oniguruma���н褵���뤫
+�ɤ��餫�����ǹԤ�ɬ�פ�����Ȥ������ȤǤ���)
+
+��������ˡ�ˤĤ��ơ��ʲ�(A)��(B)���������ޤ���
+
+�ޥ������å�API�ϡ����줾��Υץ�åȥե�����ˤ�äƤ�
+�ۤʤ�ޤ��Τǡ��ʲ�����������Ƕ���Ū�˲���Ƥ֤Τ���
+�񤯤��Ȥ�̵���Ǥ����ºݤ˻��Ѥ����ޥ������å�API�ǡ�
+�б����뵡ǽ�Τ�Τ���ꤷ�Ƥ���������
+
+(A) Oniguruma������б�������
+
+oniguruma/regint.h�����NOT_RUBY�ǰϤޤ�Ƥ�����ʬ�����
+�ʲ��Υޥ�����������ƺƥ���ѥ��뤷�Ƥ���������
+
+USE_MULTI_THREAD_SYSTEM
+
+  ñ��ͭ���ˤ���Ф褤�Ǥ���
+
+THREAD_ATOMIC_START
+THREAD_ATOMIC_END
+
+  THREAD_ATOMIC_START����THREAD_ATOMIC_END�ǰϤޤ줿
+  �ץ������Υ�������ʬ�򤢤륹��åɤ��¹���ˡ�¾��
+  ����åɤ˼¹Ը�����ư���ʤ����Ȥ��ݾ㤹���Τ����
+  ���Ƥ���������
+  (̾�����̤ꡢ�Ϥޤ줿��������ʬ�򥹥�åɥ��ȥߥå���
+   ����Ȥ�����̣)
+
+THREAD_PASS
+
+  �����¹Ԥ�������åɤ��顢¾�Υ���åɤ˼¹Ը���Ѿ�
+  �����Τ�����򤷤Ƥ���������(�ƥ������塼���ƤӽФ�
+  �Ȥ�����̣)
+  �б����뵡ǽ�������ʤ���С�������ˤ��Ƥ���������
+
+(������)
+Ruby�ξ�����ˤ���ȡ�
+Ruby�ϼ�ʬ���Ȥ��ȼ��Υ���åɵ�ǽ��������Ƥ��ޤ���
+���ε�ǽ����Ѥ���ȡ��ʲ��Τ褦���������Ф褤���Ȥ�
+�ʤ�ޤ���
+
+#define USE_MULTI_THREAD_SYSTEM
+#define THREAD_ATOMIC_START       DEFER_INTS
+#define THREAD_ATOMIC_END         ENABLE_INTS
+#define THREAD_PASS               rb_thread_schedule()
+
+Ruby�ξ�硢�����޳����ߤ���Ѥ��ơ�����åɤ��ڤ��ؤ���
+�ԤäƤ��ޤ���DEFER_INTS�ϳ����ߥϥ�ɥ�μ¹Ԥ���Ū��
+�ߤ�뤿��Υޥ����Ǥ���ENABLE_INTS�ޥ����ǳ����ߥϥ�ɥ�
+�μ¹Ԥ���Ĥ��ޤ���
+����ˤ�äơ�THREAD_ATOMIC_START����THREAD_ATOMIC_END
+�ǰϤޤ줿��ʬ�μ¹���ˡ�¾�Υ���åɤ˼¹Ը�����ư���ޤ���
+
+
+(B) ���ץꥱ������������б�������
+
+�ʲ����ݾ㤹��褦�ˡ�����åɤμ¹Ԥ����椷�Ƥ���������
+
+Ʊ����ʣ���Υ���åɤ�������ɽ�����֥������Ȥ�������롢�ޤ��ϲ������롢���Ȥ�
+�ԤʤäƤϤʤ�ʤ��������Υ��֥������Ȥ������̤Τ�ΤǤ��äƤ⡣
+
+onig_new(), onig_new_deluxe(), onig_free()�Τɤ줫�θƤӽФ���
+ʣ���Υ���åɤ�Ʊ���˼¹Ԥ��뤳�Ȥ��򤱤Ƥ���������Ʊ���Ǥʤ�����̤ˤ��ޤ��ޤ���
+
+����ϲ���ɬ�פʤΤ��Ȥ����ȡ�����ɽ�����֥������Ȥ��������
+�����ǡ������Ƕ��̤˻��Ȥ���ơ��֥뤬����ޤ���
+���Υơ��֥���Ф��ƤΥǡ�����Ͽ������ʣ���Υ���åɤǾ��ͤ���
+�۾�ʾ��֤ˤʤ�ʤ������ɬ�פǤ���
+
+// END
diff --git a/ext/mbstring/oniguruma/doc/RE b/ext/mbstring/oniguruma/doc/RE
new file mode 100644
index 0000000000..5a2783d167
--- /dev/null
+++ b/ext/mbstring/oniguruma/doc/RE
@@ -0,0 +1,412 @@
+Oniguruma Regular Expressions Version 4.3.0    2006/08/17
+
+syntax: ONIG_SYNTAX_RUBY (default)
+
+
+1. Syntax elements
+
+  \       escape (enable or disable meta character meaning)
+  |       alternation
+  (...)   group
+  [...]   character class  
+
+
+2. Characters
+
+  \t           horizontal tab (0x09)
+  \v           vertical tab   (0x0B)
+  \n           newline        (0x0A)
+  \r           return         (0x0D)
+  \b           back space     (0x08)
+  \f           form feed      (0x0C)
+  \a           bell           (0x07)
+  \e           escape         (0x1B)
+  \nnn         octal char            (encoded byte value)
+  \xHH         hexadecimal char      (encoded byte value)
+  \x{7HHHHHHH} wide hexadecimal char (character code point value)
+  \cx          control char          (character code point value)
+  \C-x         control char          (character code point value)
+  \M-x         meta  (x|0x80)        (character code point value)
+  \M-\C-x      meta control char     (character code point value)
+
+ (* \b is effective in character class [...] only)
+
+
+3. Character types
+
+  .        any character (except newline)
+
+  \w       word character
+
+           Not Unicode:
+             alphanumeric, "_" and multibyte char. 
+
+           Unicode:
+             General_Category -- (Letter|Mark|Number|Connector_Punctuation)
+
+  \W       non word char
+
+  \s       whitespace char
+
+           Not Unicode:
+             \t, \n, \v, \f, \r, \x20
+
+           Unicode:
+             0009, 000A, 000B, 000C, 000D, 0085(NEL), 
+             General_Category -- Line_Separator
+                              -- Paragraph_Separator
+                              -- Space_Separator
+
+  \S       non whitespace char
+
+  \d       decimal digit char
+
+           Unicode: General_Category -- Decimal_Number
+
+  \D       non decimal digit char
+
+  \h       hexadecimal digit char   [0-9a-fA-F]
+
+  \H       non hexadecimal digit char
+
+
+4. Quantifier
+
+  greedy
+
+    ?       1 or 0 times
+    *       0 or more times
+    +       1 or more times
+    {n,m}   at least n but not more than m times
+    {n,}    at least n times
+    {,n}    at least 0 but not more than n times ({0,n})
+    {n}     n times
+
+  reluctant
+
+    ??      1 or 0 times
+    *?      0 or more times
+    +?      1 or more times
+    {n,m}?  at least n but not more than m times  
+    {n,}?   at least n times
+    {,n}?   at least 0 but not more than n times (== {0,n}?)
+
+  possessive (greedy and does not backtrack after repeated)
+
+    ?+      1 or 0 times
+    *+      0 or more times
+    ++      1 or more times
+
+    ({n,m}+, {n,}+, {n}+ are possessive op. in ONIG_SYNTAX_JAVA only)
+
+    ex. /a*+/ === /(?>a*)/
+
+
+5. Anchors
+
+  ^       beginning of the line
+  $       end of the line
+  \b      word boundary
+  \B      not word boundary
+  \A      beginning of string
+  \Z      end of string, or before newline at the end
+  \z      end of string
+  \G      matching start position (*)
+
+          * Ruby Regexp:
+                 previous end-of-match position
+                (This specification is not related to this library.)
+
+
+6. Character class
+
+  ^...    negative class (lowest precedence operator)
+  x-y     range from x to y
+  [...]   set (character class in character class)
+  ..&&..  intersection (next-lowest precedence, after ^)
+          
+    ex. [a-w&&[^c-g]z] ==> ([a-w] AND ([^c-g] OR z)) ==> [abh-w]
+
+  * If you want to use '[', '-', ']' as a normal character
+    in a character class, you should escape these characters by '\'.
+
+
+  POSIX bracket ([:xxxxx:], negate [:^xxxxx:])
+
+    Not Unicode Case:
+
+    alnum    alphabet or digit char
+    alpha    alphabet
+    ascii    code value: [0 - 127]
+    blank    \t, \x20
+    cntrl
+    digit    0-9
+    graph    include all of multibyte encoded characters
+    lower
+    print    include all of multibyte encoded characters
+    punct
+    space    \t, \n, \v, \f, \r, \x20
+    upper
+    xdigit   0-9, a-f, A-F
+
+
+    Unicode Case:
+
+    alnum    Letter | Mark | Decimal_Number
+    alpha    Letter | Mark
+    ascii    0000 - 007F
+    blank    Space_Separator | 0009
+    cntrl    Control | Format | Unassigned | Private_Use | Surrogate
+    digit    Decimal_Number
+    graph    [[:^space:]] && ^Control && ^Unassigned && ^Surrogate
+    lower    Lowercase_Letter
+    print    [[:graph:]] | [[:space:]]
+    punct    Connector_Punctuation | Dash_Punctuation | Close_Punctuation |
+             Final_Punctuation | Initial_Punctuation | Other_Punctuation |
+             Open_Punctuation
+    space    Space_Separator | Line_Separator | Paragraph_Separator |
+             0009 | 000A | 000B | 000C | 000D | 0085
+    upper    Uppercase_Letter
+    xdigit   0030 - 0039 | 0041 - 0046 | 0061 - 0066
+             (0-9, a-f, A-F)
+
+
+7. Extended groups
+
+  (?#...)            comment
+
+  (?imx-imx)         option on/off
+                         i: ignore case
+                         m: multi-line (dot(.) match newline)
+                         x: extended form
+  (?imx-imx:subexp)  option on/off for subexp
+
+  (?:subexp)         not captured group
+  (subexp)           captured group
+
+  (?=subexp)         look-ahead
+  (?!subexp)         negative look-ahead
+  (?<=subexp)        look-behind
+  (?<!subexp)        negative look-behind
+
+                     Subexp of look-behind must be fixed character length.
+                     But different character length is allowed in top level
+                     alternatives only.
+                     ex. (?<=a|bc) is OK. (?<=aaa(?:b|cd)) is not allowed.
+
+                     In negative-look-behind, captured group isn't allowed, 
+                     but shy group(?:) is allowed.
+
+  (?>subexp)         atomic group
+                     don't backtrack in subexp.
+
+  (?<name>subexp)    define named group
+                     (All characters of the name must be a word character.
+                     And first character must not be a digit or upper case)
+
+                     Not only a name but a number is assigned like a captured
+                     group.
+
+                     Assigning the same name as two or more subexps is allowed.
+                     In this case, a subexp call can not be performed although
+                     the back reference is possible.
+
+
+8. Back reference
+
+  \n          back reference by group number (n >= 1)
+  \k<name>    back reference by group name
+
+  In a back reference by a name that has multiple definitions,
+  the subexp with the largest number is referred to preferentially.
+  (When it has not matched, a group with a smaller number is referred to.)
+
+  * Back reference by group number is forbidden if named group is defined 
+    in the pattern and ONIG_OPTION_CAPTURE_GROUP is not set.
+
+
+  back reference with nest level
+
+    (This function is disabled in Ruby 1.9.)
+
+    \k<name+n>     n: 0, 1, 2, ...
+    \k<name-n>     n: 0, 1, 2, ...
+
+    Designate the nest level relative to the back reference position.
+
+    ex 1.
+
+      /\A(?<a>|.|(?:(?<b>.)\g<a>\k<b+0>))\z/.match("reer")
+
+    ex 2.
+
+      r = Regexp.compile(<<'__REGEXP__'.strip, Regexp::EXTENDED)
+      (?<element> \g<stag> \g<content>* \g<etag> ){0}
+      (?<stag> < \g<name> \s* > ){0}
+      (?<name> [a-zA-Z_:]+ ){0}
+      (?<content> [^<&]+ (\g<element> | [^<&]+)* ){0}
+      (?<etag> </ \k<name+1> >){0}
+      \g<element>
+      __REGEXP__
+
+      p r.match('<foo>f<bar>bbb</bar>f</foo>').captures
+
+
+
+9. Subexp call ("Tanaka Akira special")
+
+  \g<name>    call by group name
+  \g<n>       call by group number (n >= 1)
+
+  * left-most recursive call is not allowed.
+     ex. (?<name>a|\g<name>b)   => error
+         (?<name>a|b\g<name>c)  => OK
+
+  * Call by group number is forbidden if named group is defined in the pattern
+    and ONIG_OPTION_CAPTURE_GROUP is not set.
+
+  * If the option status of called group is different from calling position
+    then the group's option is effective.
+
+    ex. (?-i:\g<name>)(?i:(?<name>a)){0}  match to "A"
+
+
+10. Captured group
+
+  Behavior of the no-named group (...) changes with the following conditions.
+  (But named group is not changed.)
+
+  case 1. /.../     (named group is not used, no option)
+
+     (...) is treated as a captured group.
+
+  case 2. /.../g    (named group is not used, 'g' option)
+
+     (...) is treated as a no-captured group (?:...).
+
+  case 3. /..(?<name>..)../   (named group is used, no option)
+
+     (...) is treated as a no-captured group (?:...).
+     numbered-backref/call is not allowed.
+
+  case 4. /..(?<name>..)../G  (named group is used, 'G' option)
+
+     (...) is treated as a captured group.
+     numbered-backref/call is allowed.
+
+  where
+    g: ONIG_OPTION_DONT_CAPTURE_GROUP
+    G: ONIG_OPTION_CAPTURE_GROUP
+
+  ('g' and 'G' options were discussed on the ruby-dev ML)
+
+  These options are not implemented in Ruby level.
+
+
+-----------------------------
+A-1. Syntax-dependent options
+
+   + ONIG_SYNTAX_RUBY
+     (?m): dot(.) match newline
+
+   + ONIG_SYNTAX_PERL and ONIG_SYNTAX_JAVA
+     (?s): dot(.) match newline
+     (?m): ^ match after newline, $ match before newline
+
+
+A-2. Original extensions
+
+   + hexadecimal digit char type  \h, \H
+   + named group                  (?<name>...)
+   + named backref                \k<name>
+   + subexp call                  \g<name>, \g<group-num>
+
+
+A-3. Features lacking compared with Perl 5.8.0
+
+   + [:word:]
+   + \N{name}
+   + \l,\u,\L,\U, \X, \C
+   + (?{code})
+   + (??{code})
+   + (?(condition)yes-pat|no-pat)
+
+   * \Q...\E
+     This is effective on ONIG_SYNTAX_PERL and ONIG_SYNTAX_JAVA.
+
+   * \p{property}, \P{property}
+     This is effective on ONIG_SYNTAX_PERL and ONIG_SYNTAX_JAVA.
+     Alnum, Alpha, Blank, Cntrl, Digit, Graph, Lower,
+     Print, Punct, Space, Upper, XDigit, ASCII are supported.
+
+     Prefix 'Is' of property name is allowed in ONIG_SYNTAX_PERL only.
+     ex. \p{IsXDigit}.
+
+     Negation operator of property is supported in ONIG_SYNTAX_PERL only.
+     \p{^...}, \P{^...}
+
+
+A-4. Differences with Japanized GNU regex(version 0.12) of Ruby
+
+   + add hexadecimal digit char type (\h, \H)
+   + add look-behind
+     (?<=fixed-char-length-pattern), (?<!fixed-char-length-pattern)
+   + add possessive quantifier. ?+, *+, ++
+   + add operations in character class. [], &&
+     ('[' must be escaped to be used as a usual char in a character class.)
+   + add named group and subexp call.
+   + octal or hexadecimal number sequence can be treated as 
+     a multibyte code char in character class if multibyte encoding
+     is specified.
+     (ex. [\xa1\xa2], [\xa1\xa7-\xa4\xa1])
+   + allow the range of single byte char and multibyte char in character
+     class.
+     ex. /[a-<<any EUC-JP character>>]/ in EUC-JP encoding.
+   + effect range of isolated option is to next ')'.
+     ex. (?:(?i)a|b) is interpreted as (?:(?i:a|b)), not (?:(?i:a)|b).
+   + isolated option is not transparent to previous pattern.
+     ex. a(?i)* is a syntax error pattern.
+   + allow an incomplete left brace as a usual string.
+     ex. /{/, /({)/, /a{2,3/ etc...
+   + negative POSIX bracket [:^xxxx:] is supported.
+   + POSIX bracket [:ascii:] is added.
+   + repeat of look-ahead is not allowed.
+     ex. /(?=a)*/, /(?!b){5}/
+   + Ignore case option is effective to numbered character.
+     ex. /\x61/i =~ "A"
+   + In the range quantifier, the number of the minimum is omissible.
+     /a{,n}/ == /a{0,n}/
+     Simultaneous omission of both the minimum and the maximum
+     number of times is not allowed. (/a{,}/)
+   + /a{n}?/ is not a non-greedy operator.
+     /a{n}?/ == /(?:a{n})?/
+   + an invalid back reference is checked and causes an error.
+     /\1/, /(a)\2/
+   + Zero-length match in infinite repeat stops the repeat,
+     then changes of the capture group status are checked as stop condition.
+     /(?:()|())*\1\2/ =~ ""
+     /(?:\1a|())*/ =~ "a"
+
+
+A-5. Disabled functions by default syntax
+
+   + capture history
+
+     (?@...) and (?@<name>...)
+
+     ex. /(?@a)*/.match("aaa") ==> [<0-1>, <1-2>, <2-3>]
+
+     see sample/listcap.c file.
+
+
+A-6. Problems
+
+   + Invalid encoding byte sequence is not checked in UTF-8.
+
+     * Invalid first byte is treated as a character.
+       /./u =~ "\xa3"
+
+     * Incomplete byte sequence is not checked.
+       /\w+/ =~ "a\xf3\x8ec"
+
+// END
diff --git a/ext/mbstring/oniguruma/doc/RE.ja b/ext/mbstring/oniguruma/doc/RE.ja
new file mode 100644
index 0000000000..51681715c4
--- /dev/null
+++ b/ext/mbstring/oniguruma/doc/RE.ja
@@ -0,0 +1,424 @@
+鬼車 正規表現 Version 4.3.0    2006/08/17
+
+����ʸˡ: ONIG_SYNTAX_RUBY (������)
+
+
+1. ��������
+
+  \       ���򽤾� (����������)  ����ɽ�������ͭ��/̵��������
+  |       �����
+  (...)   ������   (���롼��)
+  [...]   ʸ������ (ʸ�����饹)
+
+
+2. ʸ��
+
+  \t           ��ʿ����         (0x09)
+  \v           ��ľ����         (0x0B)
+  \n           ����             (0x0A)
+  \r           ����             (0x0D)
+  \b           �������         (0x08)
+  \f           ����             (0x0C)
+  \a           ��               (0x07)
+  \e           ���򽤾�         (0x1B)
+  \nnn         Ȭ�ʿ�ɽ��        ��沽�Х�����(�ΰ���)
+  \xHH         ��ϻ�ʿ�ɽ��      ��沽�Х�����(�ΰ���)
+  \x{7HHHHHHH} ��ĥ��ϻ�ʿ�ɽ��  �����ɥݥ������
+  \cx          ����ʸ��ɽ��      �����ɥݥ������
+  \C-x         ����ʸ��ɽ��      �����ɥݥ������
+  \M-x         Ķ  (x|0x80)      �����ɥݥ������
+  \M-\C-x      Ķ + ����ʸ��ɽ�� �����ɥݥ������
+
+  �� \b�ϡ�ʸ��������ǤΤ�ͭ��
+
+
+3. ʸ����
+
+  .        Ǥ��ʸ�� (���Ԥ����)
+
+  \w       ñ�칽��ʸ��
+
+           Unicode�ʳ��ξ��:
+             �ѿ���, "_" ����� ¿�Х���ʸ����
+
+           Unicode�ξ��:
+             General_Category -- (Letter|Mark|Number|Connector_Punctuation)
+
+  \W       ��ñ�칽��ʸ��
+
+  \s       ����ʸ��
+
+           Unicode�ʳ��ξ��:
+             \t, \n, \v, \f, \r, \x20
+
+           Unicode�ξ��:
+             0009, 000A, 000B, 000C, 000D, 0085(NEL), 
+             General_Category -- Line_Separator
+                              -- Paragraph_Separator
+                              -- Space_Separator
+
+  \S       �����ʸ��
+
+  \d       10�ʿ���
+
+           Unicode�ξ��: General_Category -- Decimal_Number
+
+  \D       ��10�ʿ���
+
+  \h       16�ʿ���    [0-9a-fA-F]
+
+  \H       ��16�ʿ���
+
+
+
+4. �̻����
+
+  ��ĥ��
+
+    ?       ���ޤ�������
+    *       ����ʾ�
+    +       ���ʾ�
+    {n,m}   n��ʾ�m��ʲ�
+    {n,}    n��ʾ�
+    {,n}    ����ʾ�n��ʲ� ({0,n})
+    {n}     n��
+
+  ̵��
+
+    ??      ���ޤ�������
+    *?      ����ʾ�
+    +?      ���ʾ�
+    {n,m}?  n��ʾ�m��ʲ�
+    {n,}?   n��ʾ�
+    {,n}?   ����ʾ�n��ʲ� (== {0,n}?)
+
+  ���� (��ĥ��ǡ������֤�������������ϲ���򸺤餹�褦�ʸ���ƻ�Ԥ򤷤ʤ�)
+
+    ?+      ���ޤ�������
+    *+      ����ʾ�
+    ++      ���ʾ�
+
+    ({n,m}+, {n,}+, {n}+ �ϡ�ONIG_SYNTAX_JAVA�ǤΤ߶��ߤʻ����)
+
+    ��. /a*+/ === /(?>a*)/
+
+
+5. ��
+
+  ^       ��Ƭ
+  $       ����
+  \b      ñ�춭��
+  \B      ��ñ�춭��
+  \A      ʸ������Ƭ
+  \Z      ʸ�����������ޤ���ʸ���������β��Ԥ�ľ��
+  \z      ʸ��������
+  \G      �ȹ糫�ϰ���(*)
+
+          * Ruby Regexp:
+                 ����ȹ�������������
+                (���λ��ͤ�Ruby�μ����˴ؤ����ΤǤ��ꡢ
+                 ����ɽ���饤�֥��Ȥ�̵�ط�)
+
+
+6. ʸ������
+
+  ^...    ����   (����ͥ���ٱ黻��)
+  x-y     �ϰ�   (x����y�ޤ�)
+  [...]   ����   (ʸ��������ʸ������)
+  ..&&..  �ѱ黻 (^�μ���ͥ���٤��㤤�黻��)
+
+     ��. [a-w&&[^c-g]z] ==> ([a-w] and ([^c-g] or z)) ==> [abh-w]
+
+  �� '[', '-', ']'��ʸ����������̾�ʸ���ΰ�̣�ǻ��Ѥ��������ˤϡ�
+     ������ʸ����'\'�����򽤾����ʤ���Фʤ�ʤ���
+
+
+  POSIX�֥饱�å� ([:xxxxx:], ���� [:^xxxxx:])
+
+    Unicode�ʳ��ξ��:
+
+    alnum    �ѿ���
+    alpha    �ѻ�
+    ascii    0 - 127
+    blank    \t, \x20
+    cntrl
+    digit    0-9
+    graph    ¿�Х���ʸ��������ޤ�
+    lower
+    print    ¿�Х���ʸ��������ޤ�
+    punct
+    space    \t, \n, \v, \f, \r, \x20
+    upper
+    xdigit   0-9, a-f, A-F
+
+    Unicode�ξ��:
+
+    alnum    Letter | Mark | Decimal_Number
+    alpha    Letter | Mark
+    ascii    0000 - 007F
+    blank    Space_Separator | 0009
+    cntrl    Control | Format | Unassigned | Private_Use | Surrogate
+    digit    Decimal_Number
+    graph    [[:^space:]] && ^Control && ^Unassigned && ^Surrogate
+    lower    Lowercase_Letter
+    print    [[:graph:]] | [[:space:]]
+    punct    Connector_Punctuation | Dash_Punctuation | Close_Punctuation |
+             Final_Punctuation | Initial_Punctuation | Other_Punctuation |
+             Open_Punctuation
+    space    Space_Separator | Line_Separator | Paragraph_Separator |
+             0009 | 000A | 000B | 000C | 000D | 0085
+    upper    Uppercase_Letter
+    xdigit   0030 - 0039 | 0041 - 0046 | 0061 - 0066
+             (0-9, a-f, A-F)
+
+
+7. ��ĥ������
+
+  (?#...)           ����
+  (?imx-imx)        ��Ω���ץ����
+                      i: ��ʸ����ʸ���ȹ�
+                      m: ʣ����
+                      x: ��ĥ����
+  (?imx-imx:��)     �����ץ����
+
+  (��)              ��ͼ�����
+  (?:��)            ����ͼ�����
+
+  (?=��)            ���ɤ�
+  (?!��)            �������ɤ�
+  (?<=��)           ����ɤ�
+  (?<!��)           ��������ɤ�
+
+                    ����ɤߤμ��ϸ���ʸ��Ĺ�Ǥʤ���Фʤ�ʤ���
+                    ���������Ǿ�̤�����Ҥ����ϰۤʤä�ʸ��Ĺ��������롣
+                    ��. (?<=a|bc) �ϵ���. (?<=aaa(?:b|cd)) ���Ե���
+
+                    ��������ɤߤǤϡ���ͼ�����ϵ�����ʤ�����
+                    ����ͼ�����ϵ�����롣
+
+  (?>��)            ����Ū������
+                    �����Τ��̲ᤷ���Ȥ���������Ǥθ���ƻ�Ԥ�Ԥʤ�ʤ�
+
+  (?<name>��)       ̾���դ���ͼ�����
+                    �������̾���������Ƥ�(�������)��
+                    (̾����ñ�칽��ʸ���Ǥʤ���Фʤ�ʤ����ǽ��ʸ����
+                     ����ʸ���Ǥ��äƤϤ����ʤ���)
+
+                    ̾�������Ǥʤ�����ͼ������Ʊ�ͤ��ֹ�������Ƥ��롣
+                    �ֹ���꤬�ػߤ���Ƥ��ʤ����� (10. ��ͼ����� �򻲾�)
+                    �ΤȤ��ϡ�̾����Ȥ�ʤ����ֹ�Ǥ⻲�ȤǤ��롣
+
+                    ʣ���μ������Ʊ��̾����Ϳ���뤳�Ȥϵ�����Ƥ��롣
+                    ���ξ��ˤϡ�����̾������Ѥ����������Ȥϲ�ǽ�Ǥ��뤬��
+                    ��ʬ���ƽФ��ϤǤ��ʤ���
+
+
+8. ��������
+
+  \n          �ֹ���껲�� (n >= 1)
+  \k<name>    ̾�����껲��
+
+  ̾�����껲�Ȥǡ�����̾����ʣ���μ������¿���������Ƥ�����ˤϡ�
+  �ֹ���礭�������礫��ͥ��Ū�˻��Ȥ���롣
+  (�ޥå����ʤ��Ȥ��ˤ��ֹ�ξ����������礬���Ȥ����)
+
+  �� �ֹ���껲�Ȥϡ�̾���դ���ͼ����礬������졢
+     ���� ONIG_OPTION_CAPTURE_GROUP�����ꤵ��Ƥ��ʤ����ˤϡ�
+     �ػߤ���롣(10. ��ͼ����� �򻲾�)
+
+
+  �ͥ��ȥ�٥��դ���������
+
+    ���ε�ǽ�ϸ��ߡ�Ruby 1.9�Ǥ�̵���ˤ��Ƥ��롣
+
+    \k<name+n>     n: 0, 1, 2, ...
+    \k<name-n>     n: 0, 1, 2, ...
+
+    �������Ȥΰ��֤�������Ū����ʬ���ƽФ��ͥ��ȥ�٥����ꤷ�ơ����Υ�٥�Ǥ�
+    ����ͤ򻲾Ȥ��롣
+
+    ��-1.
+
+      /\A(?<a>|.|(?:(?<b>.)\g<a>\k<b+0>))\z/.match("reer")
+
+    ��-2.
+
+      r = Regexp.compile(<<'__REGEXP__'.strip, Regexp::EXTENDED)
+      (?<element> \g<stag> \g<content>* \g<etag> ){0}
+      (?<stag> < \g<name> \s* > ){0}
+      (?<name> [a-zA-Z_:]+ ){0}
+      (?<content> [^<&]+ (\g<element> | [^<&]+)* ){0}
+      (?<etag> </ \k<name+1> >){0}
+      \g<element>
+      __REGEXP__
+
+      p r.match('<foo>f<bar>bbb</bar>f</foo>').captures
+
+
+
+9. ��ʬ���ƽФ� ("����ů���ڥ����")
+
+  \g<name>    ̾������ƽФ�
+  \g<n>       �ֹ����ƽФ� (n >= 1)
+
+  �� �Ǻ����֤ǤκƵ��ƽФ��϶ػߤ���롣
+     ��. (?<name>a|\g<name>b)   => error
+         (?<name>a|b\g<name>c)  => OK
+
+  �� �ֹ����ƽФ��ϡ�̾���դ���ͼ����礬������졢
+     ���� ONIG_OPTION_CAPTURE_GROUP�����ꤵ��Ƥ��ʤ����ˤϡ�
+     �ػߤ���롣 (10. ��ͼ����� �򻲾�)
+
+  �� �ƤӽФ��줿������Υ��ץ������֤��ƽФ�¦�Υ��ץ������֤ȰۤʤäƤ���
+     �Ȥ����ƤӽФ��줿¦�Υ��ץ������֤�ͭ���Ǥ��롣
+
+     ��. (?-i:\g<name>)(?i:(?<name>a)){0} �� "A" �˾ȹ��������롣
+
+
+10. ��ͼ�����
+
+  ��ͼ�����(...)�ϡ��ʲ��ξ��˱����ƿ����Ѳ����롣
+  (̾���դ���ͼ�������Ѳ����ʤ�)
+
+  case 1. /.../     (̾���դ���ͼ�������Ի��ѡ����ץ����ʤ�)
+
+     (...) �ϡ���ͼ�����Ȥ��ư����롣
+
+  case 2. /.../g    (̾���դ���ͼ�������Ի��ѡ����ץ���� 'g'�����)
+
+     (...) �ϡ�����ͼ�����Ȥ��ư����롣
+
+  case 3. /..(?<name>..)../   (̾���դ���ͼ�����ϻ��ѡ����ץ����ʤ�)
+
+     (...) �ϡ�����ͼ�����Ȥ��ư����롣
+     �ֹ���껲��/�ƤӽФ����Ե��ġ�
+
+  case 4. /..(?<name>..)../G  (̾���դ���ͼ�����ϻ��ѡ����ץ���� 'G'�����)
+
+     (...) �ϡ���ͼ�����Ȥ��ư����롣
+     �ֹ���껲��/�ƤӽФ��ϵ��ġ�
+
+  â��
+    g: ONIG_OPTION_DONT_CAPTURE_GROUP
+    G: ONIG_OPTION_CAPTURE_GROUP
+    ('g'��'G'���ץ����ϡ�ruby-dev ML�ǵ������줿��)
+
+  �����ο���ΰ�̣�ϡ�
+  ̾���դ���ͤ�̾��̵����ͤ�Ʊ���˻��Ѥ���ɬ�����Τ�����̤Ͼ��ʤ��Ǥ�����
+  �Ȥ�����ͳ����ͤ���줿��ΤǤ��롣
+  �����Υ��ץ����ˤĤ��Ƥϡ�Ruby�Ǥϸ��߼�������Ƥ��ʤ���
+
+
+-----------------------------
+�䵭 1. ʸˡ��¸���ץ����
+
+   + ONIG_SYNTAX_RUBY
+     (?m): �����䵭��(.)�ϲ��ԤȾȹ�����
+
+   + ONIG_SYNTAX_PERL �� ONIG_SYNTAX_JAVA
+     (?s): �����䵭��(.)�ϲ��ԤȾȹ�����
+     (?m): ^ �ϲ��Ԥ�ľ��˾ȹ礹�롢$ �ϲ��Ԥ�ľ���˾ȹ礹��
+
+
+�䵭 2. �ȼ���ĥ��ǽ
+
+   + 16�ʿ���������16�ʿ���  \h, \H
+   + ̾���դ���ͼ�����      (?<name>...)
+   + ̾�������������        \k<name>
+   + ��ʬ���ƽФ�            \g<name>, \g<group-num>
+
+
+�䵭 3. Perl 5.8.0����Ӥ���¸�ߤ��ʤ���ǽ
+
+   + [:word:]
+   + \N{name}
+   + \l,\u,\L,\U, \X, \C
+   + (?{code})
+   + (??{code})
+   + (?(condition)yes-pat|no-pat)
+
+   * \Q...\E
+     â��ONIG_SYNTAX_PERL��ONIG_SYNTAX_JAVA�Ǥ�ͭ��
+
+   * \p{property}, \P{property}
+     â��ONIG_SYNTAX_PERL��ONIG_SYNTAX_JAVA�Ǥ�ͭ��
+     Alnum, Alpha, Blank, Cntrl, Digit, Graph, Lower,
+     Print, Punct, Space, Upper, XDigit, ASCII������Ǥ��롣
+
+     ����̾������ 'Is'���ֻ����Ѥ��뤳�Ȥϡ�ONIG_SYNTAX_PERL�ǤΤ�
+     ������Ƥ��롣
+     ex. \p{IsXDigit}.
+
+     ����������黻�Ҥϡ�ONIG_SYNTAX_PERL�ǤΤߵ�����Ƥ��롣
+     \p{^...}, \P{^...}
+
+
+�䵭 4. Ruby�����ܸ첽 GNU regex(version 0.12)�Ȥΰ㤤
+
+   + 16�ʿ����������ɲ� (\h, \H)
+   + ����ɤߵ�ǽ���ɲ�
+   + ���ߤʷ����֤�����Ҥ��ɲ� (?+, *+, ++)
+   + ʸ���������α黻�Ҥ��ɲ� ([...], &&)
+     ('[' �ϡ�ʸ�����������̾��ʸ���Ȥ��ƻ��Ѥ���Ȥ��ˤ�
+      ���򽤾����ʤ���Фʤ�ʤ�)
+   + ̾���դ���ͼ�����ȡ���ʬ���ƽФ���ǽ�ɲ�
+   + ¿�Х���ʸ�������ɤ����ꤵ��Ƥ���Ȥ���
+     ʸ����������Ȭ�ʿ��ޤ��Ͻ�ϻ�ʿ�ɽ����Ϣ³�ϡ�¿�Х�������ɽ�����줿
+     ��Ĥ�ʸ���Ȳ�ᤵ���
+     (��. [\xa1\xa2], [\xa1\xa7-\xa4\xa1])
+   + ʸ���������ǡ���Х���ʸ����¿�Х���ʸ�����ϰϻ���ϵ�����롣
+     ex. /[a-��]/
+   + ��Ω���ץ�����ͭ���ϰϤϡ����θ�Ω���ץ�����ޤ�Ǥ��뼰�����
+     �����ޤǤǤ���
+     ��. (?:(?i)a|b) �� (?:(?i:a|b)) �Ȳ�ᤵ��롢(?:(?i:a)|b)�ǤϤʤ�
+   + ��Ω���ץ����Ϥ������μ����Ф���Ʃ��Ū�ǤϤʤ�
+     ��. /a(?i)*/ ��ʸˡ���顼�Ȥʤ�
+   + �Դ����ʷ����֤��ϰϻ���Ҥ��̾��ʸ����Ȥ��Ƶ��Ĥ����
+     ��. /{/, /({)/, /a{2,3/
+   + ����ŪPOSIX�֥饱�å� [:^xxxx:] ���ɲ�
+   + POSIX�֥饱�å� [:ascii:] ���ɲ�
+   + ���ɤߤη����֤����Ե���
+     ��. /(?=a)*/, /(?!b){5}/
+   + ���ͤǻ��ꤵ�줿ʸ�����Ф��Ƥ⡢��ʸ����ʸ���ȹ祪�ץ�����ͭ��
+     ��. /\x61/i =~ "A"
+   + �����֤��������ǡ��������ξ�ά(0��)���Ǥ���
+     /a{,n}/ == /a{0,n}/
+     �������Ⱥ�������Ʊ����ά�ϵ�����ʤ���(/a{,}/)
+   + /a{n}?/��̵�ߤʱ黻�ҤǤϤʤ���
+     /a{n}?/ == /(?:a{n})?/
+   + ̵���ʸ������Ȥ�����å����ƥ��顼�ˤ��롣
+     /\1/, /(a)\2/
+   + ̵�·����֤�����ǡ�Ĺ�����Ǥξȹ������Ϸ����֤������Ǥ����뤬��
+     ���ΤȤ������Ǥ��٤����ɤ�����Ƚ��Ȥ��ơ���ͼ��������;��֤�
+     �Ѳ��ޤǹ�θ���Ƥ���
+     /(?:()|())*\1\2/ =~ ""
+     /(?:\1a|())*/ =~ "a"
+
+
+
+�䵭 5. ��������Ƥ��뤬�������ͤǤ�ͭ���ˤ��Ƥ��ʤ���ǽ
+
+   + ������򻲾�
+
+     (?@...) �� (?@<name>...)
+
+     ��. /(?@a)*/.match("aaa") ==> [<0-1>, <1-2>, <2-3>]
+
+     ������ˡ�ϡ�sample/listcap.c�򻲾�
+
+     ͭ���ˤ��Ƥ��ʤ���ͳ�ϡ��ɤ��������Ω�Ĥ��Ϥä��ꤷ�ʤ����ᡣ
+
+
+�䵭 6. ������
+
+   + UTF-8�ǡ��Х����ͤ�Ŭ���ʲ����ɤ����Υ����å��ϹԤʤäƤ��ʤ���
+
+     * ��Ƭ�Х��ȤȤ��������ʥХ��Ȥ��ʸ���Ȥߤʤ�
+       /./u =~ "\xa3"
+
+     * �Դ����ʥХ��ȥ������󥹤Υ����å��򤷤ʤ�
+      /\w+/ =~ "a\xf3\x8ec"
+
+     �����Ĵ�٤뤳�Ȥϲ�ǽ�ǤϤ��뤬���٤��ʤ�ΤǹԤʤ�ʤ���
+
+����
author	Seiji Masugata <masugata@php.net>	2006-08-24 17:20:58 +0000
committer	Seiji Masugata <masugata@php.net>	2006-08-24 17:20:58 +0000
commit	99211d04442b5d92ceff94ccd01e6b57ef23f796 (patch)
tree	027f88310c759c71833c140765b0f90691b9e04f /ext/mbstring/oniguruma/doc
parent	74685a184f4b001d608911aa0c7a3cba11eb8fe7 (diff)
download	php-git-99211d04442b5d92ceff94ccd01e6b57ef23f796.tar.gz