1 #ifndef ONIGURUMA_H
2 #define ONIGURUMA_H
3 /**********************************************************************
4   oniguruma.h - Oniguruma (regular expression library)
5 **********************************************************************/
6 /*-
7  * Copyright (c) 2002-2021  K.Kosako
8  * All rights reserved.
9  *
10  * Redistribution and use in source and binary forms, with or without
11  * modification, are permitted provided that the following conditions
12  * are met:
13  * 1. Redistributions of source code must retain the above copyright
14  *    notice, this list of conditions and the following disclaimer.
15  * 2. Redistributions in binary form must reproduce the above copyright
16  *    notice, this list of conditions and the following disclaimer in the
17  *    documentation and/or other materials provided with the distribution.
18  *
19  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
20  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
21  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
22  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
23  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
24  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
25  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
26  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
27  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
28  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
29  * SUCH DAMAGE.
30  */
31 
32 #ifdef __cplusplus
33 extern "C" {
34 #endif
35 
36 #define ONIGURUMA
37 #define ONIGURUMA_VERSION_MAJOR   6
38 #define ONIGURUMA_VERSION_MINOR   9
39 #define ONIGURUMA_VERSION_TEENY   7
40 
41 #define ONIGURUMA_VERSION_INT     60907
42 
43 #ifndef P_
44 #if defined(__STDC__) || defined(_WIN32)
45 # define P_(args) args
46 #else
47 # define P_(args) ()
48 #endif
49 #endif
50 
51 #ifndef PV_
52 # define PV_(args) args
53 #endif
54 
55 #ifndef ONIG_STATIC
56 #ifndef ONIG_EXTERN
57 #if defined(_WIN32) && !defined(__GNUC__)
58 #if defined(ONIGURUMA_EXPORT)
59 #define ONIG_EXTERN   extern __declspec(dllexport)
60 #else
61 #define ONIG_EXTERN   extern __declspec(dllimport)
62 #endif
63 #endif
64 #endif
65 
66 #ifndef ONIG_EXTERN
67 #define ONIG_EXTERN   extern
68 #endif
69 #else
70 #define ONIG_EXTERN   extern
71 #endif
72 
73 #ifndef ONIG_VARIADIC_FUNC_ATTR
74 #define ONIG_VARIADIC_FUNC_ATTR
75 #endif
76 
77 /* PART: character encoding */
78 
79 #ifndef ONIG_ESCAPE_UCHAR_COLLISION
80 #define UChar OnigUChar
81 #endif
82 
83 typedef unsigned int   OnigCodePoint;
84 typedef unsigned char  OnigUChar;
85 typedef unsigned int   OnigCtype;
86 typedef unsigned int   OnigLen;
87 
88 #define ONIG_INFINITE_DISTANCE  ~((OnigLen )0)
89 
90 typedef unsigned int OnigCaseFoldType; /* case fold flag */
91 
92 ONIG_EXTERN OnigCaseFoldType OnigDefaultCaseFoldFlag;
93 
94 #define ONIGENC_CASE_FOLD_ASCII_ONLY            (1)
95 /* #define ONIGENC_CASE_FOLD_HIRAGANA_KATAKANA  (1<<1) */
96 /* #define ONIGENC_CASE_FOLD_KATAKANA_WIDTH     (1<<2) */
97 #define ONIGENC_CASE_FOLD_TURKISH_AZERI         (1<<20)
98 #define INTERNAL_ONIGENC_CASE_FOLD_MULTI_CHAR   (1<<30)
99 
100 #define ONIGENC_CASE_FOLD_MIN      INTERNAL_ONIGENC_CASE_FOLD_MULTI_CHAR
101 #define ONIGENC_CASE_FOLD_DEFAULT  OnigDefaultCaseFoldFlag
102 
103 
104 #define ONIGENC_MAX_COMP_CASE_FOLD_CODE_LEN       3
105 #define ONIGENC_GET_CASE_FOLD_CODES_MAX_NUM      13
106 /* 13 => Unicode:0x1ffc */
107 
108 /* code range */
109 #define ONIGENC_CODE_RANGE_NUM(range)     ((int )range[0])
110 #define ONIGENC_CODE_RANGE_FROM(range,i)  range[((i)*2) + 1]
111 #define ONIGENC_CODE_RANGE_TO(range,i)    range[((i)*2) + 2]
112 
113 typedef struct {
114   int byte_len;  /* argument(original) character(s) byte length */
115   int code_len;  /* number of code */
116   OnigCodePoint code[ONIGENC_MAX_COMP_CASE_FOLD_CODE_LEN];
117 } OnigCaseFoldCodeItem;
118 
119 typedef struct {
120   OnigCodePoint esc;
121   OnigCodePoint anychar;
122   OnigCodePoint anytime;
123   OnigCodePoint zero_or_one_time;
124   OnigCodePoint one_or_more_time;
125   OnigCodePoint anychar_anytime;
126 } OnigMetaCharTableType;
127 
128 typedef int (*OnigApplyAllCaseFoldFunc)(OnigCodePoint from, OnigCodePoint* to, int to_len, void* arg);
129 
130 typedef struct OnigEncodingTypeST {
131   int    (*mbc_enc_len)(const OnigUChar* p);
132   const char*   name;
133   int           max_enc_len;
134   int           min_enc_len;
135   int    (*is_mbc_newline)(const OnigUChar* p, const OnigUChar* end);
136   OnigCodePoint (*mbc_to_code)(const OnigUChar* p, const OnigUChar* end);
137   int    (*code_to_mbclen)(OnigCodePoint code);
138   int    (*code_to_mbc)(OnigCodePoint code, OnigUChar *buf);
139   int    (*mbc_case_fold)(OnigCaseFoldType flag, const OnigUChar** pp, const OnigUChar* end, OnigUChar* to);
140   int    (*apply_all_case_fold)(OnigCaseFoldType flag, OnigApplyAllCaseFoldFunc f, void* arg);
141   int    (*get_case_fold_codes_by_str)(OnigCaseFoldType flag, const OnigUChar* p, const OnigUChar* end, OnigCaseFoldCodeItem acs[]);
142   int    (*property_name_to_ctype)(struct OnigEncodingTypeST* enc, OnigUChar* p, OnigUChar* end);
143   int    (*is_code_ctype)(OnigCodePoint code, OnigCtype ctype);
144   int    (*get_ctype_code_range)(OnigCtype ctype, OnigCodePoint* sb_out, const OnigCodePoint* ranges[]);
145   OnigUChar* (*left_adjust_char_head)(const OnigUChar* start, const OnigUChar* p);
146   int    (*is_allowed_reverse_match)(const OnigUChar* p, const OnigUChar* end);
147   int    (*init)(void);
148   int    (*is_initialized)(void);
149   int    (*is_valid_mbc_string)(const OnigUChar* s, const OnigUChar* end);
150   unsigned int flag;
151   OnigCodePoint sb_range;
152   int index;
153 } OnigEncodingType;
154 
155 typedef OnigEncodingType* OnigEncoding;
156 
157 ONIG_EXTERN OnigEncodingType OnigEncodingASCII;
158 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_1;
159 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_2;
160 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_3;
161 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_4;
162 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_5;
163 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_6;
164 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_7;
165 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_8;
166 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_9;
167 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_10;
168 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_11;
169 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_13;
170 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_14;
171 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_15;
172 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_16;
173 ONIG_EXTERN OnigEncodingType OnigEncodingUTF8;
174 ONIG_EXTERN OnigEncodingType OnigEncodingUTF16_BE;
175 ONIG_EXTERN OnigEncodingType OnigEncodingUTF16_LE;
176 ONIG_EXTERN OnigEncodingType OnigEncodingUTF32_BE;
177 ONIG_EXTERN OnigEncodingType OnigEncodingUTF32_LE;
178 ONIG_EXTERN OnigEncodingType OnigEncodingEUC_JP;
179 ONIG_EXTERN OnigEncodingType OnigEncodingEUC_TW;
180 ONIG_EXTERN OnigEncodingType OnigEncodingEUC_KR;
181 ONIG_EXTERN OnigEncodingType OnigEncodingEUC_CN;
182 ONIG_EXTERN OnigEncodingType OnigEncodingSJIS;
183 ONIG_EXTERN OnigEncodingType OnigEncodingKOI8;
184 ONIG_EXTERN OnigEncodingType OnigEncodingKOI8_R;
185 ONIG_EXTERN OnigEncodingType OnigEncodingCP1251;
186 ONIG_EXTERN OnigEncodingType OnigEncodingBIG5;
187 ONIG_EXTERN OnigEncodingType OnigEncodingGB18030;
188 
189 #define ONIG_ENCODING_ASCII        (&OnigEncodingASCII)
190 #define ONIG_ENCODING_ISO_8859_1   (&OnigEncodingISO_8859_1)
191 #define ONIG_ENCODING_ISO_8859_2   (&OnigEncodingISO_8859_2)
192 #define ONIG_ENCODING_ISO_8859_3   (&OnigEncodingISO_8859_3)
193 #define ONIG_ENCODING_ISO_8859_4   (&OnigEncodingISO_8859_4)
194 #define ONIG_ENCODING_ISO_8859_5   (&OnigEncodingISO_8859_5)
195 #define ONIG_ENCODING_ISO_8859_6   (&OnigEncodingISO_8859_6)
196 #define ONIG_ENCODING_ISO_8859_7   (&OnigEncodingISO_8859_7)
197 #define ONIG_ENCODING_ISO_8859_8   (&OnigEncodingISO_8859_8)
198 #define ONIG_ENCODING_ISO_8859_9   (&OnigEncodingISO_8859_9)
199 #define ONIG_ENCODING_ISO_8859_10  (&OnigEncodingISO_8859_10)
200 #define ONIG_ENCODING_ISO_8859_11  (&OnigEncodingISO_8859_11)
201 #define ONIG_ENCODING_ISO_8859_13  (&OnigEncodingISO_8859_13)
202 #define ONIG_ENCODING_ISO_8859_14  (&OnigEncodingISO_8859_14)
203 #define ONIG_ENCODING_ISO_8859_15  (&OnigEncodingISO_8859_15)
204 #define ONIG_ENCODING_ISO_8859_16  (&OnigEncodingISO_8859_16)
205 #define ONIG_ENCODING_UTF8         (&OnigEncodingUTF8)
206 #define ONIG_ENCODING_UTF16_BE     (&OnigEncodingUTF16_BE)
207 #define ONIG_ENCODING_UTF16_LE     (&OnigEncodingUTF16_LE)
208 #define ONIG_ENCODING_UTF32_BE     (&OnigEncodingUTF32_BE)
209 #define ONIG_ENCODING_UTF32_LE     (&OnigEncodingUTF32_LE)
210 #define ONIG_ENCODING_EUC_JP       (&OnigEncodingEUC_JP)
211 #define ONIG_ENCODING_EUC_TW       (&OnigEncodingEUC_TW)
212 #define ONIG_ENCODING_EUC_KR       (&OnigEncodingEUC_KR)
213 #define ONIG_ENCODING_EUC_CN       (&OnigEncodingEUC_CN)
214 #define ONIG_ENCODING_SJIS         (&OnigEncodingSJIS)
215 #define ONIG_ENCODING_KOI8         (&OnigEncodingKOI8)
216 #define ONIG_ENCODING_KOI8_R       (&OnigEncodingKOI8_R)
217 #define ONIG_ENCODING_CP1251       (&OnigEncodingCP1251)
218 #define ONIG_ENCODING_BIG5         (&OnigEncodingBIG5)
219 #define ONIG_ENCODING_GB18030      (&OnigEncodingGB18030)
220 
221 #define ONIG_ENCODING_UNDEF    ((OnigEncoding )0)
222 
223 
224 /* work size */
225 #define ONIGENC_CODE_TO_MBC_MAXLEN       7
226 #define ONIGENC_MBC_CASE_FOLD_MAXLEN    18
227 /* 18: 6(max-byte) * 3(case-fold chars) */
228 
229 /* character types */
230 typedef enum {
231   ONIGENC_CTYPE_NEWLINE = 0,
232   ONIGENC_CTYPE_ALPHA   = 1,
233   ONIGENC_CTYPE_BLANK   = 2,
234   ONIGENC_CTYPE_CNTRL   = 3,
235   ONIGENC_CTYPE_DIGIT   = 4,
236   ONIGENC_CTYPE_GRAPH   = 5,
237   ONIGENC_CTYPE_LOWER   = 6,
238   ONIGENC_CTYPE_PRINT   = 7,
239   ONIGENC_CTYPE_PUNCT   = 8,
240   ONIGENC_CTYPE_SPACE   = 9,
241   ONIGENC_CTYPE_UPPER   = 10,
242   ONIGENC_CTYPE_XDIGIT  = 11,
243   ONIGENC_CTYPE_WORD    = 12,
244   ONIGENC_CTYPE_ALNUM   = 13,  /* alpha || digit */
245   ONIGENC_CTYPE_ASCII   = 14
246 } OnigEncCtype;
247 
248 #define ONIGENC_MAX_STD_CTYPE  ONIGENC_CTYPE_ASCII
249 
250 
251 #define onig_enc_len(enc,p,end)        ONIGENC_MBC_ENC_LEN(enc,p)
252 
253 #define ONIGENC_IS_UNDEF(enc)          ((enc) == ONIG_ENCODING_UNDEF)
254 #define ONIGENC_IS_SINGLEBYTE(enc)     (ONIGENC_MBC_MAXLEN(enc) == 1)
255 #define ONIGENC_IS_MBC_HEAD(enc,p)     (ONIGENC_MBC_ENC_LEN(enc,p) != 1)
256 #define ONIGENC_IS_MBC_ASCII(p)           (*(p)   < 128)
257 #define ONIGENC_IS_CODE_ASCII(code)       ((code) < 128)
258 #define ONIGENC_IS_MBC_WORD(enc,s,end) \
259    ONIGENC_IS_CODE_WORD(enc,ONIGENC_MBC_TO_CODE(enc,s,end))
260 #define ONIGENC_IS_MBC_WORD_ASCII(enc,s,end) onigenc_is_mbc_word_ascii(enc,s,end)
261 
262 #define ONIGENC_NAME(enc)                      ((enc)->name)
263 
264 #define ONIGENC_MBC_CASE_FOLD(enc,flag,pp,end,buf) \
265   (enc)->mbc_case_fold(flag,(const OnigUChar** )pp,end,buf)
266 #define ONIGENC_IS_ALLOWED_REVERSE_MATCH(enc,s,end) \
267         (enc)->is_allowed_reverse_match(s,end)
268 #define ONIGENC_LEFT_ADJUST_CHAR_HEAD(enc,start,s) \
269         (enc)->left_adjust_char_head(start, s)
270 #define ONIGENC_IS_VALID_MBC_STRING(enc,s,end) \
271         (enc)->is_valid_mbc_string(s,end)
272 #define ONIGENC_APPLY_ALL_CASE_FOLD(enc,case_fold_flag,f,arg) \
273         (enc)->apply_all_case_fold(case_fold_flag,f,arg)
274 #define ONIGENC_GET_CASE_FOLD_CODES_BY_STR(enc,case_fold_flag,p,end,acs) \
275        (enc)->get_case_fold_codes_by_str(case_fold_flag,p,end,acs)
276 #define ONIGENC_STEP_BACK(enc,start,s,n) \
277         onigenc_step_back((enc),(start),(s),(n))
278 
279 #define ONIGENC_MBC_ENC_LEN(enc,p)             (enc)->mbc_enc_len(p)
280 #define ONIGENC_MBC_MAXLEN(enc)               ((enc)->max_enc_len)
281 #define ONIGENC_MBC_MAXLEN_DIST(enc)           ONIGENC_MBC_MAXLEN(enc)
282 #define ONIGENC_MBC_MINLEN(enc)               ((enc)->min_enc_len)
283 #define ONIGENC_IS_MBC_NEWLINE(enc,p,end)      (enc)->is_mbc_newline((p),(end))
284 #define ONIGENC_MBC_TO_CODE(enc,p,end)         (enc)->mbc_to_code((p),(end))
285 #define ONIGENC_CODE_TO_MBCLEN(enc,code)       (enc)->code_to_mbclen(code)
286 #define ONIGENC_CODE_TO_MBC(enc,code,buf)      (enc)->code_to_mbc(code,buf)
287 #define ONIGENC_PROPERTY_NAME_TO_CTYPE(enc,p,end) \
288   (enc)->property_name_to_ctype(enc,p,end)
289 
290 #define ONIGENC_IS_CODE_CTYPE(enc,code,ctype)  (enc)->is_code_ctype(code,ctype)
291 
292 #define ONIGENC_IS_CODE_NEWLINE(enc,code) \
293         ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_NEWLINE)
294 #define ONIGENC_IS_CODE_GRAPH(enc,code) \
295         ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_GRAPH)
296 #define ONIGENC_IS_CODE_PRINT(enc,code) \
297         ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_PRINT)
298 #define ONIGENC_IS_CODE_ALNUM(enc,code) \
299         ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_ALNUM)
300 #define ONIGENC_IS_CODE_ALPHA(enc,code) \
301         ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_ALPHA)
302 #define ONIGENC_IS_CODE_LOWER(enc,code) \
303         ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_LOWER)
304 #define ONIGENC_IS_CODE_UPPER(enc,code) \
305         ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_UPPER)
306 #define ONIGENC_IS_CODE_CNTRL(enc,code) \
307         ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_CNTRL)
308 #define ONIGENC_IS_CODE_PUNCT(enc,code) \
309         ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_PUNCT)
310 #define ONIGENC_IS_CODE_SPACE(enc,code) \
311         ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_SPACE)
312 #define ONIGENC_IS_CODE_BLANK(enc,code) \
313         ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_BLANK)
314 #define ONIGENC_IS_CODE_DIGIT(enc,code) \
315         ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_DIGIT)
316 #define ONIGENC_IS_CODE_XDIGIT(enc,code) \
317         ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_XDIGIT)
318 #define ONIGENC_IS_CODE_WORD(enc,code) \
319         ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_WORD)
320 
321 #define ONIGENC_GET_CTYPE_CODE_RANGE(enc,ctype,sbout,ranges) \
322         (enc)->get_ctype_code_range(ctype,sbout,ranges)
323 
324 ONIG_EXTERN
325 OnigUChar* onigenc_step_back P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s, int n));
326 
327 
328 /* encoding API */
329 ONIG_EXTERN
330 int onigenc_init P_((void));
331 ONIG_EXTERN
332 int onig_initialize_encoding P_((OnigEncoding enc));
333 ONIG_EXTERN
334 int onigenc_set_default_encoding P_((OnigEncoding enc));
335 ONIG_EXTERN
336 OnigEncoding onigenc_get_default_encoding P_((void));
337 ONIG_EXTERN
338 void  onigenc_set_default_caseconv_table P_((const OnigUChar* table));
339 ONIG_EXTERN
340 OnigUChar* onigenc_get_right_adjust_char_head_with_prev P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s, const OnigUChar** prev));
341 ONIG_EXTERN
342 OnigUChar* onigenc_get_prev_char_head P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s));
343 ONIG_EXTERN
344 OnigUChar* onigenc_get_left_adjust_char_head P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s));
345 ONIG_EXTERN
346 OnigUChar* onigenc_get_right_adjust_char_head P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s));
347 ONIG_EXTERN
348 int onigenc_strlen P_((OnigEncoding enc, const OnigUChar* p, const OnigUChar* end));
349 ONIG_EXTERN
350 int onigenc_strlen_null P_((OnigEncoding enc, const OnigUChar* p));
351 ONIG_EXTERN
352 int onigenc_str_bytelen_null P_((OnigEncoding enc, const OnigUChar* p));
353 ONIG_EXTERN
354 int onigenc_is_valid_mbc_string P_((OnigEncoding enc, const OnigUChar* s, const OnigUChar* end));
355 ONIG_EXTERN
356 OnigUChar* onigenc_strdup P_((OnigEncoding enc, const OnigUChar* s, const OnigUChar* end));
357 
358 
359 /* PART: regular expression */
360 
361 /* config parameters */
362 #define ONIG_NREGION                          10
363 #define ONIG_MAX_CAPTURE_NUM          2147483647  /* 2**31 - 1 */
364 #define ONIG_MAX_BACKREF_NUM                1000
365 #define ONIG_MAX_REPEAT_NUM               100000
366 #define ONIG_MAX_MULTI_BYTE_RANGES_NUM     10000
367 /* constants */
368 #define ONIG_MAX_ERROR_MESSAGE_LEN            90
369 
370 typedef unsigned int        OnigOptionType;
371 
372 #define ONIG_OPTION_DEFAULT            ONIG_OPTION_NONE
373 
374 /* options */
375 #define ONIG_OPTION_NONE                 0U
376 /* options (compile time) */
377 #define ONIG_OPTION_IGNORECASE           1U
378 #define ONIG_OPTION_EXTEND               (ONIG_OPTION_IGNORECASE         << 1)
379 #define ONIG_OPTION_MULTILINE            (ONIG_OPTION_EXTEND             << 1)
380 #define ONIG_OPTION_SINGLELINE           (ONIG_OPTION_MULTILINE          << 1)
381 #define ONIG_OPTION_FIND_LONGEST         (ONIG_OPTION_SINGLELINE         << 1)
382 #define ONIG_OPTION_FIND_NOT_EMPTY       (ONIG_OPTION_FIND_LONGEST       << 1)
383 #define ONIG_OPTION_NEGATE_SINGLELINE    (ONIG_OPTION_FIND_NOT_EMPTY     << 1)
384 #define ONIG_OPTION_DONT_CAPTURE_GROUP   (ONIG_OPTION_NEGATE_SINGLELINE  << 1)
385 #define ONIG_OPTION_CAPTURE_GROUP        (ONIG_OPTION_DONT_CAPTURE_GROUP << 1)
386 /* options (search time) */
387 #define ONIG_OPTION_NOTBOL                    (ONIG_OPTION_CAPTURE_GROUP << 1)
388 #define ONIG_OPTION_NOTEOL                    (ONIG_OPTION_NOTBOL << 1)
389 #define ONIG_OPTION_POSIX_REGION              (ONIG_OPTION_NOTEOL << 1)
390 #define ONIG_OPTION_CHECK_VALIDITY_OF_STRING  (ONIG_OPTION_POSIX_REGION << 1)
391 /* options (compile time) */
392 #define ONIG_OPTION_IGNORECASE_IS_ASCII  (ONIG_OPTION_CHECK_VALIDITY_OF_STRING << 3)
393 #define ONIG_OPTION_WORD_IS_ASCII        (ONIG_OPTION_IGNORECASE_IS_ASCII << 1)
394 #define ONIG_OPTION_DIGIT_IS_ASCII       (ONIG_OPTION_WORD_IS_ASCII << 1)
395 #define ONIG_OPTION_SPACE_IS_ASCII       (ONIG_OPTION_DIGIT_IS_ASCII << 1)
396 #define ONIG_OPTION_POSIX_IS_ASCII       (ONIG_OPTION_SPACE_IS_ASCII << 1)
397 #define ONIG_OPTION_TEXT_SEGMENT_EXTENDED_GRAPHEME_CLUSTER  (ONIG_OPTION_POSIX_IS_ASCII << 1)
398 #define ONIG_OPTION_TEXT_SEGMENT_WORD    (ONIG_OPTION_TEXT_SEGMENT_EXTENDED_GRAPHEME_CLUSTER << 1)
399 /* options (search time) */
400 #define ONIG_OPTION_NOT_BEGIN_STRING     (ONIG_OPTION_TEXT_SEGMENT_WORD << 1)
401 #define ONIG_OPTION_NOT_END_STRING       (ONIG_OPTION_NOT_BEGIN_STRING << 1)
402 #define ONIG_OPTION_NOT_BEGIN_POSITION   (ONIG_OPTION_NOT_END_STRING << 1)
403 #define ONIG_OPTION_CALLBACK_EACH_MATCH  (ONIG_OPTION_NOT_BEGIN_POSITION << 1)
404 
405 #define ONIG_OPTION_MAXBIT               ONIG_OPTION_CALLBACK_EACH_MATCH
406 
407 #define ONIG_OPTION_ON(options,regopt)      ((options) |= (regopt))
408 #define ONIG_OPTION_OFF(options,regopt)     ((options) &= ~(regopt))
409 #define ONIG_IS_OPTION_ON(options,option)   ((options) & (option))
410 
411 /* syntax */
412 typedef struct {
413   unsigned int   op;
414   unsigned int   op2;
415   unsigned int   behavior;
416   OnigOptionType options;   /* default option */
417   OnigMetaCharTableType meta_char_table;
418 } OnigSyntaxType;
419 
420 ONIG_EXTERN OnigSyntaxType OnigSyntaxASIS;
421 ONIG_EXTERN OnigSyntaxType OnigSyntaxPosixBasic;
422 ONIG_EXTERN OnigSyntaxType OnigSyntaxPosixExtended;
423 ONIG_EXTERN OnigSyntaxType OnigSyntaxEmacs;
424 ONIG_EXTERN OnigSyntaxType OnigSyntaxGrep;
425 ONIG_EXTERN OnigSyntaxType OnigSyntaxGnuRegex;
426 ONIG_EXTERN OnigSyntaxType OnigSyntaxJava;
427 ONIG_EXTERN OnigSyntaxType OnigSyntaxPerl;
428 ONIG_EXTERN OnigSyntaxType OnigSyntaxPerl_NG;
429 ONIG_EXTERN OnigSyntaxType OnigSyntaxRuby;
430 ONIG_EXTERN OnigSyntaxType OnigSyntaxPython;
431 ONIG_EXTERN OnigSyntaxType OnigSyntaxOniguruma;
432 
433 /* predefined syntaxes (see regsyntax.c) */
434 #define ONIG_SYNTAX_ASIS               (&OnigSyntaxASIS)
435 #define ONIG_SYNTAX_POSIX_BASIC        (&OnigSyntaxPosixBasic)
436 #define ONIG_SYNTAX_POSIX_EXTENDED     (&OnigSyntaxPosixExtended)
437 #define ONIG_SYNTAX_EMACS              (&OnigSyntaxEmacs)
438 #define ONIG_SYNTAX_GREP               (&OnigSyntaxGrep)
439 #define ONIG_SYNTAX_GNU_REGEX          (&OnigSyntaxGnuRegex)
440 #define ONIG_SYNTAX_JAVA               (&OnigSyntaxJava)
441 #define ONIG_SYNTAX_PERL               (&OnigSyntaxPerl)
442 #define ONIG_SYNTAX_PERL_NG            (&OnigSyntaxPerl_NG)
443 #define ONIG_SYNTAX_RUBY               (&OnigSyntaxRuby)
444 #define ONIG_SYNTAX_PYTHON             (&OnigSyntaxPython)
445 #define ONIG_SYNTAX_ONIGURUMA          (&OnigSyntaxOniguruma)
446 
447 /* default syntax */
448 ONIG_EXTERN OnigSyntaxType*   OnigDefaultSyntax;
449 #define ONIG_SYNTAX_DEFAULT   OnigDefaultSyntax
450 
451 /* syntax (operators) */
452 #define ONIG_SYN_OP_VARIABLE_META_CHARACTERS    (1U<<0)
453 #define ONIG_SYN_OP_DOT_ANYCHAR                 (1U<<1)   /* . */
454 #define ONIG_SYN_OP_ASTERISK_ZERO_INF           (1U<<2)   /* * */
455 #define ONIG_SYN_OP_ESC_ASTERISK_ZERO_INF       (1U<<3)
456 #define ONIG_SYN_OP_PLUS_ONE_INF                (1U<<4)   /* + */
457 #define ONIG_SYN_OP_ESC_PLUS_ONE_INF            (1U<<5)
458 #define ONIG_SYN_OP_QMARK_ZERO_ONE              (1U<<6)   /* ? */
459 #define ONIG_SYN_OP_ESC_QMARK_ZERO_ONE          (1U<<7)
460 #define ONIG_SYN_OP_BRACE_INTERVAL              (1U<<8)   /* {lower,upper} */
461 #define ONIG_SYN_OP_ESC_BRACE_INTERVAL          (1U<<9)   /* \{lower,upper\} */
462 #define ONIG_SYN_OP_VBAR_ALT                    (1U<<10)   /* | */
463 #define ONIG_SYN_OP_ESC_VBAR_ALT                (1U<<11)  /* \| */
464 #define ONIG_SYN_OP_LPAREN_SUBEXP               (1U<<12)  /* (...)   */
465 #define ONIG_SYN_OP_ESC_LPAREN_SUBEXP           (1U<<13)  /* \(...\) */
466 #define ONIG_SYN_OP_ESC_AZ_BUF_ANCHOR           (1U<<14)  /* \A, \Z, \z */
467 #define ONIG_SYN_OP_ESC_CAPITAL_G_BEGIN_ANCHOR  (1U<<15)  /* \G     */
468 #define ONIG_SYN_OP_DECIMAL_BACKREF             (1U<<16)  /* \num   */
469 #define ONIG_SYN_OP_BRACKET_CC                  (1U<<17)  /* [...]  */
470 #define ONIG_SYN_OP_ESC_W_WORD                  (1U<<18)  /* \w, \W */
471 #define ONIG_SYN_OP_ESC_LTGT_WORD_BEGIN_END     (1U<<19)  /* \<. \> */
472 #define ONIG_SYN_OP_ESC_B_WORD_BOUND            (1U<<20)  /* \b, \B */
473 #define ONIG_SYN_OP_ESC_S_WHITE_SPACE           (1U<<21)  /* \s, \S */
474 #define ONIG_SYN_OP_ESC_D_DIGIT                 (1U<<22)  /* \d, \D */
475 #define ONIG_SYN_OP_LINE_ANCHOR                 (1U<<23)  /* ^, $   */
476 #define ONIG_SYN_OP_POSIX_BRACKET               (1U<<24)  /* [:xxxx:] */
477 #define ONIG_SYN_OP_QMARK_NON_GREEDY            (1U<<25)  /* ??,*?,+?,{n,m}? */
478 #define ONIG_SYN_OP_ESC_CONTROL_CHARS           (1U<<26)  /* \n,\r,\t,\a ... */
479 #define ONIG_SYN_OP_ESC_C_CONTROL               (1U<<27)  /* \cx  */
480 #define ONIG_SYN_OP_ESC_OCTAL3                  (1U<<28)  /* \OOO */
481 #define ONIG_SYN_OP_ESC_X_HEX2                  (1U<<29)  /* \xHH */
482 #define ONIG_SYN_OP_ESC_X_BRACE_HEX8            (1U<<30)  /* \x{7HHHHHHH} */
483 #define ONIG_SYN_OP_ESC_O_BRACE_OCTAL           (1U<<31)  /* \o{1OOOOOOOOOO} */
484 
485 #define ONIG_SYN_OP2_ESC_CAPITAL_Q_QUOTE        (1U<<0)  /* \Q...\E */
486 #define ONIG_SYN_OP2_QMARK_GROUP_EFFECT         (1U<<1)  /* (?...) */
487 #define ONIG_SYN_OP2_OPTION_PERL                (1U<<2)  /* (?imsx),(?-imsx) */
488 #define ONIG_SYN_OP2_OPTION_RUBY                (1U<<3)  /* (?imx), (?-imx)  */
489 #define ONIG_SYN_OP2_PLUS_POSSESSIVE_REPEAT     (1U<<4)  /* ?+,*+,++ */
490 #define ONIG_SYN_OP2_PLUS_POSSESSIVE_INTERVAL   (1U<<5)  /* {n,m}+   */
491 #define ONIG_SYN_OP2_CCLASS_SET_OP              (1U<<6)  /* [...&&..[..]..] */
492 #define ONIG_SYN_OP2_QMARK_LT_NAMED_GROUP       (1U<<7)  /* (?<name>...) */
493 #define ONIG_SYN_OP2_ESC_K_NAMED_BACKREF        (1U<<8)  /* \k<name> */
494 #define ONIG_SYN_OP2_ESC_G_SUBEXP_CALL          (1U<<9)  /* \g<name>, \g<n> */
495 #define ONIG_SYN_OP2_ATMARK_CAPTURE_HISTORY     (1U<<10) /* (?@..),(?@<x>..) */
496 #define ONIG_SYN_OP2_ESC_CAPITAL_C_BAR_CONTROL  (1U<<11) /* \C-x */
497 #define ONIG_SYN_OP2_ESC_CAPITAL_M_BAR_META     (1U<<12) /* \M-x */
498 #define ONIG_SYN_OP2_ESC_V_VTAB                 (1U<<13) /* \v as VTAB */
499 #define ONIG_SYN_OP2_ESC_U_HEX4                 (1U<<14) /* \uHHHH */
500 #define ONIG_SYN_OP2_ESC_GNU_BUF_ANCHOR         (1U<<15) /* \`, \' */
501 #define ONIG_SYN_OP2_ESC_P_BRACE_CHAR_PROPERTY  (1U<<16) /* \p{...}, \P{...} */
502 #define ONIG_SYN_OP2_ESC_P_BRACE_CIRCUMFLEX_NOT (1U<<17) /* \p{^..}, \P{^..} */
503 /* #define ONIG_SYN_OP2_CHAR_PROPERTY_PREFIX_IS (1U<<18) */
504 #define ONIG_SYN_OP2_ESC_H_XDIGIT               (1U<<19) /* \h, \H */
505 #define ONIG_SYN_OP2_INEFFECTIVE_ESCAPE         (1U<<20) /* \ */
506 #define ONIG_SYN_OP2_QMARK_LPAREN_IF_ELSE       (1U<<21) /* (?(n)) (?(...)...|...) */
507 #define ONIG_SYN_OP2_ESC_CAPITAL_K_KEEP         (1U<<22) /* \K */
508 #define ONIG_SYN_OP2_ESC_CAPITAL_R_GENERAL_NEWLINE (1U<<23) /* \R \r\n else [\x0a-\x0d] */
509 #define ONIG_SYN_OP2_ESC_CAPITAL_N_O_SUPER_DOT  (1U<<24) /* \N (?-m:.), \O (?m:.) */
510 #define ONIG_SYN_OP2_QMARK_TILDE_ABSENT_GROUP   (1U<<25) /* (?~...) */
511 #define ONIG_SYN_OP2_ESC_X_Y_GRAPHEME_CLUSTER   (1U<<26) /* obsoleted: use next */
512 #define ONIG_SYN_OP2_ESC_X_Y_TEXT_SEGMENT       (1U<<26) /* \X \y \Y */
513 #define ONIG_SYN_OP2_QMARK_PERL_SUBEXP_CALL     (1U<<27) /* (?R), (?&name)... */
514 #define ONIG_SYN_OP2_QMARK_BRACE_CALLOUT_CONTENTS (1U<<28) /* (?{...}) (?{{...}}) */
515 #define ONIG_SYN_OP2_ASTERISK_CALLOUT_NAME      (1U<<29) /* (*name) (*name{a,..}) */
516 #define ONIG_SYN_OP2_OPTION_ONIGURUMA           (1U<<30) /* (?imxWDSPy) */
517 #define ONIG_SYN_OP2_QMARK_CAPITAL_P_NAME       (1U<<31) /* (?P<name>...) (?P=name) */
518 
519 /* syntax (behavior) */
520 #define ONIG_SYN_CONTEXT_INDEP_ANCHORS           (1U<<31) /* not implemented */
521 #define ONIG_SYN_CONTEXT_INDEP_REPEAT_OPS        (1U<<0)  /* ?, *, +, {n,m} */
522 #define ONIG_SYN_CONTEXT_INVALID_REPEAT_OPS      (1U<<1)  /* error or ignore */
523 #define ONIG_SYN_ALLOW_UNMATCHED_CLOSE_SUBEXP    (1U<<2)  /* ...)... */
524 #define ONIG_SYN_ALLOW_INVALID_INTERVAL          (1U<<3)  /* {??? */
525 #define ONIG_SYN_ALLOW_INTERVAL_LOW_ABBREV       (1U<<4)  /* {,n} => {0,n} */
526 #define ONIG_SYN_STRICT_CHECK_BACKREF            (1U<<5)  /* /(\1)/,/\1()/ ..*/
527 #define ONIG_SYN_DIFFERENT_LEN_ALT_LOOK_BEHIND   (1U<<6)  /* (?<=a|bc) */
528 #define ONIG_SYN_CAPTURE_ONLY_NAMED_GROUP        (1U<<7)  /* see doc/RE */
529 #define ONIG_SYN_ALLOW_MULTIPLEX_DEFINITION_NAME (1U<<8)  /* (?<x>)(?<x>) */
530 #define ONIG_SYN_FIXED_INTERVAL_IS_GREEDY_ONLY   (1U<<9)  /* a{n}?=(?:a{n})? */
531 #define ONIG_SYN_ISOLATED_OPTION_CONTINUE_BRANCH (1U<<10) /* ..(?i)...|... */
532 #define ONIG_SYN_VARIABLE_LEN_LOOK_BEHIND        (1U<<11)  /* (?<=a+|..) */
533 #define ONIG_SYN_PYTHON                          (1U<<12)  /* \UHHHHHHHH */
534 
535 /* syntax (behavior) in char class [...] */
536 #define ONIG_SYN_NOT_NEWLINE_IN_NEGATIVE_CC      (1U<<20) /* [^...] */
537 #define ONIG_SYN_BACKSLASH_ESCAPE_IN_CC          (1U<<21) /* [..\w..] etc.. */
538 #define ONIG_SYN_ALLOW_EMPTY_RANGE_IN_CC         (1U<<22)
539 #define ONIG_SYN_ALLOW_DOUBLE_RANGE_OP_IN_CC     (1U<<23) /* [0-9-a]=[0-9\-a] */
540 #define ONIG_SYN_ALLOW_INVALID_CODE_END_OF_RANGE_IN_CC (1U<<26)
541 /* syntax (behavior) warning */
542 #define ONIG_SYN_WARN_CC_OP_NOT_ESCAPED          (1U<<24) /* [,-,] */
543 #define ONIG_SYN_WARN_REDUNDANT_NESTED_REPEAT    (1U<<25) /* (?:a*)+ */
544 
545 /* meta character specifiers (onig_set_meta_char()) */
546 #define ONIG_META_CHAR_ESCAPE               0
547 #define ONIG_META_CHAR_ANYCHAR              1
548 #define ONIG_META_CHAR_ANYTIME              2
549 #define ONIG_META_CHAR_ZERO_OR_ONE_TIME     3
550 #define ONIG_META_CHAR_ONE_OR_MORE_TIME     4
551 #define ONIG_META_CHAR_ANYCHAR_ANYTIME      5
552 
553 #define ONIG_INEFFECTIVE_META_CHAR          0
554 
555 /* error codes */
556 #define ONIG_IS_PATTERN_ERROR(ecode)   ((ecode) <= -100 && (ecode) > -1000)
557 
558 /* normal return */
559 #define ONIG_NORMAL                                            0
560 #define ONIG_VALUE_IS_NOT_SET                                  1
561 #define ONIG_MISMATCH                                         -1
562 #define ONIG_NO_SUPPORT_CONFIG                                -2
563 #define ONIG_ABORT                                            -3
564 
565 /* internal error */
566 #define ONIGERR_MEMORY                                         -5
567 #define ONIGERR_TYPE_BUG                                       -6
568 #define ONIGERR_PARSER_BUG                                    -11
569 #define ONIGERR_STACK_BUG                                     -12
570 #define ONIGERR_UNDEFINED_BYTECODE                            -13
571 #define ONIGERR_UNEXPECTED_BYTECODE                           -14
572 #define ONIGERR_MATCH_STACK_LIMIT_OVER                        -15
573 #define ONIGERR_PARSE_DEPTH_LIMIT_OVER                        -16
574 #define ONIGERR_RETRY_LIMIT_IN_MATCH_OVER                     -17
575 #define ONIGERR_RETRY_LIMIT_IN_SEARCH_OVER                    -18
576 #define ONIGERR_SUBEXP_CALL_LIMIT_IN_SEARCH_OVER              -19
577 #define ONIGERR_DEFAULT_ENCODING_IS_NOT_SETTED                -21
578 #define ONIGERR_SPECIFIED_ENCODING_CANT_CONVERT_TO_WIDE_CHAR  -22
579 #define ONIGERR_FAIL_TO_INITIALIZE                            -23
580 /* general error */
581 #define ONIGERR_INVALID_ARGUMENT                              -30
582 /* syntax error */
583 #define ONIGERR_END_PATTERN_AT_LEFT_BRACE                    -100
584 #define ONIGERR_END_PATTERN_AT_LEFT_BRACKET                  -101
585 #define ONIGERR_EMPTY_CHAR_CLASS                             -102
586 #define ONIGERR_PREMATURE_END_OF_CHAR_CLASS                  -103
587 #define ONIGERR_END_PATTERN_AT_ESCAPE                        -104
588 #define ONIGERR_END_PATTERN_AT_META                          -105
589 #define ONIGERR_END_PATTERN_AT_CONTROL                       -106
590 #define ONIGERR_META_CODE_SYNTAX                             -108
591 #define ONIGERR_CONTROL_CODE_SYNTAX                          -109
592 #define ONIGERR_CHAR_CLASS_VALUE_AT_END_OF_RANGE             -110
593 #define ONIGERR_CHAR_CLASS_VALUE_AT_START_OF_RANGE           -111
594 #define ONIGERR_UNMATCHED_RANGE_SPECIFIER_IN_CHAR_CLASS      -112
595 #define ONIGERR_TARGET_OF_REPEAT_OPERATOR_NOT_SPECIFIED      -113
596 #define ONIGERR_TARGET_OF_REPEAT_OPERATOR_INVALID            -114
597 #define ONIGERR_NESTED_REPEAT_OPERATOR                       -115
598 #define ONIGERR_UNMATCHED_CLOSE_PARENTHESIS                  -116
599 #define ONIGERR_END_PATTERN_WITH_UNMATCHED_PARENTHESIS       -117
600 #define ONIGERR_END_PATTERN_IN_GROUP                         -118
601 #define ONIGERR_UNDEFINED_GROUP_OPTION                       -119
602 #define ONIGERR_INVALID_POSIX_BRACKET_TYPE                   -121
603 #define ONIGERR_INVALID_LOOK_BEHIND_PATTERN                  -122
604 #define ONIGERR_INVALID_REPEAT_RANGE_PATTERN                 -123
605 /* values error (syntax error) */
606 #define ONIGERR_TOO_BIG_NUMBER                               -200
607 #define ONIGERR_TOO_BIG_NUMBER_FOR_REPEAT_RANGE              -201
608 #define ONIGERR_UPPER_SMALLER_THAN_LOWER_IN_REPEAT_RANGE     -202
609 #define ONIGERR_EMPTY_RANGE_IN_CHAR_CLASS                    -203
610 #define ONIGERR_MISMATCH_CODE_LENGTH_IN_CLASS_RANGE          -204
611 #define ONIGERR_TOO_MANY_MULTI_BYTE_RANGES                   -205
612 #define ONIGERR_TOO_SHORT_MULTI_BYTE_STRING                  -206
613 #define ONIGERR_TOO_BIG_BACKREF_NUMBER                       -207
614 #define ONIGERR_INVALID_BACKREF                              -208
615 #define ONIGERR_NUMBERED_BACKREF_OR_CALL_NOT_ALLOWED         -209
616 #define ONIGERR_TOO_MANY_CAPTURES                            -210
617 #define ONIGERR_TOO_LONG_WIDE_CHAR_VALUE                     -212
618 #define ONIGERR_UNDEFINED_OPERATOR                           -213
619 #define ONIGERR_EMPTY_GROUP_NAME                             -214
620 #define ONIGERR_INVALID_GROUP_NAME                           -215
621 #define ONIGERR_INVALID_CHAR_IN_GROUP_NAME                   -216
622 #define ONIGERR_UNDEFINED_NAME_REFERENCE                     -217
623 #define ONIGERR_UNDEFINED_GROUP_REFERENCE                    -218
624 #define ONIGERR_MULTIPLEX_DEFINED_NAME                       -219
625 #define ONIGERR_MULTIPLEX_DEFINITION_NAME_CALL               -220
626 #define ONIGERR_NEVER_ENDING_RECURSION                       -221
627 #define ONIGERR_GROUP_NUMBER_OVER_FOR_CAPTURE_HISTORY        -222
628 #define ONIGERR_INVALID_CHAR_PROPERTY_NAME                   -223
629 #define ONIGERR_INVALID_IF_ELSE_SYNTAX                       -224
630 #define ONIGERR_INVALID_ABSENT_GROUP_PATTERN                 -225
631 #define ONIGERR_INVALID_ABSENT_GROUP_GENERATOR_PATTERN       -226
632 #define ONIGERR_INVALID_CALLOUT_PATTERN                      -227
633 #define ONIGERR_INVALID_CALLOUT_NAME                         -228
634 #define ONIGERR_UNDEFINED_CALLOUT_NAME                       -229
635 #define ONIGERR_INVALID_CALLOUT_BODY                         -230
636 #define ONIGERR_INVALID_CALLOUT_TAG_NAME                     -231
637 #define ONIGERR_INVALID_CALLOUT_ARG                          -232
638 #define ONIGERR_INVALID_CODE_POINT_VALUE                     -400
639 #define ONIGERR_INVALID_WIDE_CHAR_VALUE                      -400
640 #define ONIGERR_TOO_BIG_WIDE_CHAR_VALUE                      -401
641 #define ONIGERR_NOT_SUPPORTED_ENCODING_COMBINATION           -402
642 #define ONIGERR_INVALID_COMBINATION_OF_OPTIONS               -403
643 #define ONIGERR_TOO_MANY_USER_DEFINED_OBJECTS                -404
644 #define ONIGERR_TOO_LONG_PROPERTY_NAME                       -405
645 #define ONIGERR_VERY_INEFFICIENT_PATTERN                     -406
646 #define ONIGERR_LIBRARY_IS_NOT_INITIALIZED                   -500
647 
648 /* errors related to thread */
649 /* #define ONIGERR_OVER_THREAD_PASS_LIMIT_COUNT                -1001 */
650 
651 
652 /* must be smaller than MEM_STATUS_BITS_NUM (unsigned int * 8) */
653 #define ONIG_MAX_CAPTURE_HISTORY_GROUP   31
654 #define ONIG_IS_CAPTURE_HISTORY_GROUP(r, i) \
655   ((i) <= ONIG_MAX_CAPTURE_HISTORY_GROUP && (r)->list && (r)->list[i])
656 
657 typedef struct OnigCaptureTreeNodeStruct {
658   int group;   /* group number */
659   int beg;
660   int end;
661   int allocated;
662   int num_childs;
663   struct OnigCaptureTreeNodeStruct** childs;
664 } OnigCaptureTreeNode;
665 
666 /* match result region type */
667 struct re_registers {
668   int  allocated;
669   int  num_regs;
670   int* beg;
671   int* end;
672   /* extended */
673   OnigCaptureTreeNode* history_root;  /* capture history tree root */
674 };
675 
676 /* capture tree traverse */
677 #define ONIG_TRAVERSE_CALLBACK_AT_FIRST   1
678 #define ONIG_TRAVERSE_CALLBACK_AT_LAST    2
679 #define ONIG_TRAVERSE_CALLBACK_AT_BOTH \
680   ( ONIG_TRAVERSE_CALLBACK_AT_FIRST | ONIG_TRAVERSE_CALLBACK_AT_LAST )
681 
682 
683 #define ONIG_REGION_NOTPOS            -1
684 
685 typedef struct re_registers   OnigRegion;
686 
687 typedef struct {
688   OnigEncoding enc;
689   OnigUChar* par;
690   OnigUChar* par_end;
691 } OnigErrorInfo;
692 
693 typedef struct {
694   int lower;
695   int upper;
696 } OnigRepeatRange;
697 
698 typedef void (*OnigWarnFunc) P_((const char* s));
699 extern void onig_null_warn P_((const char* s));
700 #define ONIG_NULL_WARN       onig_null_warn
701 
702 #define ONIG_CHAR_TABLE_SIZE   256
703 
704 struct re_pattern_buffer;
705 typedef struct re_pattern_buffer OnigRegexType;
706 typedef OnigRegexType*  OnigRegex;
707 
708 #ifndef ONIG_ESCAPE_REGEX_T_COLLISION
709   typedef OnigRegexType  regex_t;
710 #endif
711 
712 struct OnigRegSetStruct;
713 typedef struct OnigRegSetStruct OnigRegSet;
714 
715 typedef enum {
716   ONIG_REGSET_POSITION_LEAD = 0,
717   ONIG_REGSET_REGEX_LEAD    = 1,
718   ONIG_REGSET_PRIORITY_TO_REGEX_ORDER = 2
719 } OnigRegSetLead;
720 
721 typedef struct {
722   int             num_of_elements;
723   OnigEncoding    pattern_enc;
724   OnigEncoding    target_enc;
725   OnigSyntaxType* syntax;
726   OnigOptionType  option;
727   OnigCaseFoldType   case_fold_flag;
728 } OnigCompileInfo;
729 
730 typedef int (*OnigCallbackEachMatchFunc)(const UChar* str, const UChar* end, const UChar* match_start, OnigRegion* region, void* user_data);
731 
732 
733 /* types for callout */
734 typedef enum {
735   ONIG_CALLOUT_IN_PROGRESS   = 1, /* 1<<0 */
736   ONIG_CALLOUT_IN_RETRACTION = 2  /* 1<<1 */
737 } OnigCalloutIn;
738 
739 #define ONIG_CALLOUT_IN_BOTH  (ONIG_CALLOUT_IN_PROGRESS | ONIG_CALLOUT_IN_RETRACTION)
740 
741 typedef enum {
742   ONIG_CALLOUT_OF_CONTENTS = 0,
743   ONIG_CALLOUT_OF_NAME     = 1
744 } OnigCalloutOf;
745 
746 typedef enum {
747   ONIG_CALLOUT_TYPE_SINGLE              = 0,
748   ONIG_CALLOUT_TYPE_START_CALL          = 1,
749   ONIG_CALLOUT_TYPE_BOTH_CALL           = 2,
750   ONIG_CALLOUT_TYPE_START_MARK_END_CALL = 3,
751 } OnigCalloutType;
752 
753 
754 #define ONIG_NON_NAME_ID        -1
755 #define ONIG_NON_CALLOUT_NUM     0
756 
757 #define ONIG_CALLOUT_MAX_ARGS_NUM     4
758 #define ONIG_CALLOUT_DATA_SLOT_NUM    5
759 
760 struct OnigCalloutArgsStruct;
761 typedef struct OnigCalloutArgsStruct OnigCalloutArgs;
762 
763 typedef int (*OnigCalloutFunc)(OnigCalloutArgs* args, void* user_data);
764 
765 /* callout function return values (less than -1: error code) */
766 typedef enum {
767   ONIG_CALLOUT_FAIL     =  1,
768   ONIG_CALLOUT_SUCCESS  =  0
769 } OnigCalloutResult;
770 
771 typedef enum {
772   ONIG_TYPE_VOID     = 0,
773   ONIG_TYPE_LONG     = 1<<0,
774   ONIG_TYPE_CHAR     = 1<<1,
775   ONIG_TYPE_STRING   = 1<<2,
776   ONIG_TYPE_POINTER  = 1<<3,
777   ONIG_TYPE_TAG      = 1<<4,
778 } OnigType;
779 
780 typedef union {
781   long l;
782   OnigCodePoint c;
783   struct {
784     OnigUChar* start;
785     OnigUChar* end;
786   } s;
787   void* p;
788   int tag;  /* tag -> callout_num */
789 } OnigValue;
790 
791 
792 struct OnigMatchParamStruct;
793 typedef struct OnigMatchParamStruct OnigMatchParam;
794 
795 
796 /* Oniguruma Native API */
797 
798 ONIG_EXTERN
799 int onig_initialize P_((OnigEncoding encodings[], int number_of_encodings));
800 /* onig_init(): deprecated function. Use onig_initialize(). */
801 ONIG_EXTERN
802 int onig_init P_((void));
803 ONIG_EXTERN
804 int ONIG_VARIADIC_FUNC_ATTR onig_error_code_to_str PV_((OnigUChar* s, int err_code, ...));
805 ONIG_EXTERN
806 int onig_is_error_code_needs_param PV_((int code));
807 ONIG_EXTERN
808 void onig_set_warn_func P_((OnigWarnFunc f));
809 ONIG_EXTERN
810 void onig_set_verb_warn_func P_((OnigWarnFunc f));
811 ONIG_EXTERN
812 int onig_new P_((OnigRegex*, const OnigUChar* pattern, const OnigUChar* pattern_end, OnigOptionType option, OnigEncoding enc, OnigSyntaxType* syntax, OnigErrorInfo* einfo));
813 ONIG_EXTERN
814 int  onig_reg_init P_((OnigRegex reg, OnigOptionType option, OnigCaseFoldType case_fold_flag, OnigEncoding enc, OnigSyntaxType* syntax));
815 int onig_new_without_alloc P_((OnigRegex, const OnigUChar* pattern, const OnigUChar* pattern_end, OnigOptionType option, OnigEncoding enc, OnigSyntaxType* syntax, OnigErrorInfo* einfo));
816 ONIG_EXTERN
817 int onig_new_deluxe P_((OnigRegex* reg, const OnigUChar* pattern, const OnigUChar* pattern_end, OnigCompileInfo* ci, OnigErrorInfo* einfo));
818 ONIG_EXTERN
819 void onig_free P_((OnigRegex));
820 ONIG_EXTERN
821 void onig_free_body P_((OnigRegex));
822 ONIG_EXTERN
823 int onig_scan(OnigRegex reg, const OnigUChar* str, const OnigUChar* end, OnigRegion* region, OnigOptionType option, int (*scan_callback)(int, int, OnigRegion*, void*), void* callback_arg);
824 ONIG_EXTERN
825 int onig_search P_((OnigRegex, const OnigUChar* str, const OnigUChar* end, const OnigUChar* start, const OnigUChar* range, OnigRegion* region, OnigOptionType option));
826 ONIG_EXTERN
827 int onig_search_with_param P_((OnigRegex, const OnigUChar* str, const OnigUChar* end, const OnigUChar* start, const OnigUChar* range, OnigRegion* region, OnigOptionType option, OnigMatchParam* mp));
828 ONIG_EXTERN
829 int onig_match P_((OnigRegex, const OnigUChar* str, const OnigUChar* end, const OnigUChar* at, OnigRegion* region, OnigOptionType option));
830 ONIG_EXTERN
831 int onig_match_with_param P_((OnigRegex, const OnigUChar* str, const OnigUChar* end, const OnigUChar* at, OnigRegion* region, OnigOptionType option, OnigMatchParam* mp));
832 
833 ONIG_EXTERN
834 int onig_regset_new P_((OnigRegSet** rset, int n, regex_t* regs[]));
835 ONIG_EXTERN
836 int onig_regset_add P_((OnigRegSet* set, regex_t* reg));
837 ONIG_EXTERN
838 int onig_regset_replace P_((OnigRegSet* set, int at, regex_t* reg));
839 ONIG_EXTERN
840 void onig_regset_free P_((OnigRegSet* set));
841 ONIG_EXTERN
842 int onig_regset_number_of_regex P_((OnigRegSet* set));
843 ONIG_EXTERN
844 regex_t* onig_regset_get_regex P_((OnigRegSet* set, int at));
845 ONIG_EXTERN
846 OnigRegion* onig_regset_get_region P_((OnigRegSet* set, int at));
847 ONIG_EXTERN
848 int onig_regset_search P_((OnigRegSet* set, const OnigUChar* str, const OnigUChar* end, const OnigUChar* start, const OnigUChar* range, OnigRegSetLead lead, OnigOptionType option, int* rmatch_pos));
849 ONIG_EXTERN
850 int onig_regset_search_with_param P_((OnigRegSet* set, const OnigUChar* str, const OnigUChar* end, const OnigUChar* start, const OnigUChar* range,  OnigRegSetLead lead, OnigOptionType option, OnigMatchParam* mps[], int* rmatch_pos));
851 
852 ONIG_EXTERN
853 OnigRegion* onig_region_new P_((void));
854 ONIG_EXTERN
855 void onig_region_init P_((OnigRegion* region));
856 ONIG_EXTERN
857 void onig_region_free P_((OnigRegion* region, int free_self));
858 ONIG_EXTERN
859 void onig_region_copy P_((OnigRegion* to, OnigRegion* from));
860 ONIG_EXTERN
861 void onig_region_clear P_((OnigRegion* region));
862 ONIG_EXTERN
863 int onig_region_resize P_((OnigRegion* region, int n));
864 ONIG_EXTERN
865 int onig_region_set P_((OnigRegion* region, int at, int beg, int end));
866 ONIG_EXTERN
867 int onig_name_to_group_numbers P_((OnigRegex reg, const OnigUChar* name, const OnigUChar* name_end, int** nums));
868 ONIG_EXTERN
869 int onig_name_to_backref_number P_((OnigRegex reg, const OnigUChar* name, const OnigUChar* name_end, OnigRegion *region));
870 ONIG_EXTERN
871 int onig_foreach_name P_((OnigRegex reg, int (*func)(const OnigUChar*, const OnigUChar*,int,int*,OnigRegex,void*), void* arg));
872 ONIG_EXTERN
873 int onig_number_of_names P_((OnigRegex reg));
874 ONIG_EXTERN
875 int onig_number_of_captures P_((OnigRegex reg));
876 ONIG_EXTERN
877 int onig_number_of_capture_histories P_((OnigRegex reg));
878 ONIG_EXTERN
879 OnigCaptureTreeNode* onig_get_capture_tree P_((OnigRegion* region));
880 ONIG_EXTERN
881 int onig_capture_tree_traverse P_((OnigRegion* region, int at, int(*callback_func)(int,int,int,int,int,void*), void* arg));
882 ONIG_EXTERN
883 int onig_noname_group_capture_is_active P_((OnigRegex reg));
884 ONIG_EXTERN
885 OnigEncoding onig_get_encoding P_((OnigRegex reg));
886 ONIG_EXTERN
887 OnigOptionType onig_get_options P_((OnigRegex reg));
888 ONIG_EXTERN
889 OnigCaseFoldType onig_get_case_fold_flag P_((OnigRegex reg));
890 ONIG_EXTERN
891 OnigSyntaxType* onig_get_syntax P_((OnigRegex reg));
892 ONIG_EXTERN
893 int onig_set_default_syntax P_((OnigSyntaxType* syntax));
894 ONIG_EXTERN
895 void onig_copy_syntax P_((OnigSyntaxType* to, OnigSyntaxType* from));
896 ONIG_EXTERN
897 unsigned int onig_get_syntax_op P_((OnigSyntaxType* syntax));
898 ONIG_EXTERN
899 unsigned int onig_get_syntax_op2 P_((OnigSyntaxType* syntax));
900 ONIG_EXTERN
901 unsigned int onig_get_syntax_behavior P_((OnigSyntaxType* syntax));
902 ONIG_EXTERN
903 OnigOptionType onig_get_syntax_options P_((OnigSyntaxType* syntax));
904 ONIG_EXTERN
905 void onig_set_syntax_op P_((OnigSyntaxType* syntax, unsigned int op));
906 ONIG_EXTERN
907 void onig_set_syntax_op2 P_((OnigSyntaxType* syntax, unsigned int op2));
908 ONIG_EXTERN
909 void onig_set_syntax_behavior P_((OnigSyntaxType* syntax, unsigned int behavior));
910 ONIG_EXTERN
911 void onig_set_syntax_options P_((OnigSyntaxType* syntax, OnigOptionType options));
912 ONIG_EXTERN
913 int onig_set_meta_char P_((OnigSyntaxType* syntax, unsigned int what, OnigCodePoint code));
914 ONIG_EXTERN
915 void onig_copy_encoding P_((OnigEncoding to, OnigEncoding from));
916 ONIG_EXTERN
917 OnigCaseFoldType onig_get_default_case_fold_flag P_((void));
918 ONIG_EXTERN
919 int onig_set_default_case_fold_flag P_((OnigCaseFoldType case_fold_flag));
920 ONIG_EXTERN
921 unsigned int onig_get_match_stack_limit_size P_((void));
922 ONIG_EXTERN
923 int onig_set_match_stack_limit_size P_((unsigned int size));
924 ONIG_EXTERN
925 unsigned long onig_get_retry_limit_in_match P_((void));
926 ONIG_EXTERN
927 int onig_set_retry_limit_in_match P_((unsigned long n));
928 ONIG_EXTERN
929 unsigned long onig_get_retry_limit_in_search P_((void));
930 ONIG_EXTERN
931 int onig_set_retry_limit_in_search P_((unsigned long n));
932 ONIG_EXTERN
933 unsigned int onig_get_parse_depth_limit P_((void));
934 ONIG_EXTERN
935 int onig_set_capture_num_limit P_((int num));
936 ONIG_EXTERN
937 int onig_set_parse_depth_limit P_((unsigned int depth));
938 ONIG_EXTERN
939 unsigned long onig_get_subexp_call_limit_in_search P_((void));
940 ONIG_EXTERN
941 int onig_set_subexp_call_limit_in_search P_((unsigned long n));
942 ONIG_EXTERN
943 int onig_get_subexp_call_max_nest_level P_((void));
944 ONIG_EXTERN
945 int onig_set_subexp_call_max_nest_level P_((int level));
946 ONIG_EXTERN
947 int onig_unicode_define_user_property P_((const char* name, OnigCodePoint* ranges));
948 ONIG_EXTERN
949 int onig_end P_((void));
950 ONIG_EXTERN
951 const char* onig_version P_((void));
952 ONIG_EXTERN
953 const char* onig_copyright P_((void));
954 
955 /* for callback each match */
956 ONIG_EXTERN
957 OnigCallbackEachMatchFunc onig_get_callback_each_match P_((void));
958 ONIG_EXTERN
959 int onig_set_callback_each_match P_((OnigCallbackEachMatchFunc f));
960 
961 /* for OnigMatchParam */
962 ONIG_EXTERN
963 OnigMatchParam* onig_new_match_param P_((void));
964 ONIG_EXTERN
965 void onig_free_match_param P_((OnigMatchParam* p));
966 ONIG_EXTERN
967 void onig_free_match_param_content P_((OnigMatchParam* p));
968 ONIG_EXTERN
969 int onig_initialize_match_param P_((OnigMatchParam* mp));
970 ONIG_EXTERN
971 int onig_set_match_stack_limit_size_of_match_param P_((OnigMatchParam* param, unsigned int limit));
972 ONIG_EXTERN
973 int onig_set_retry_limit_in_match_of_match_param P_((OnigMatchParam* param, unsigned long limit));
974 ONIG_EXTERN
975 int onig_set_retry_limit_in_search_of_match_param P_((OnigMatchParam* param, unsigned long limit));
976 ONIG_EXTERN
977 int onig_set_progress_callout_of_match_param P_((OnigMatchParam* param, OnigCalloutFunc f));
978 ONIG_EXTERN
979 int onig_set_retraction_callout_of_match_param P_((OnigMatchParam* param, OnigCalloutFunc f));
980 ONIG_EXTERN
981 int onig_set_callout_user_data_of_match_param P_((OnigMatchParam* param, void* user_data));
982 
983 /* for callout functions */
984 ONIG_EXTERN
985 OnigCalloutFunc onig_get_progress_callout P_((void));
986 ONIG_EXTERN
987 int onig_set_progress_callout P_((OnigCalloutFunc f));
988 ONIG_EXTERN
989 OnigCalloutFunc onig_get_retraction_callout P_((void));
990 ONIG_EXTERN
991 int onig_set_retraction_callout P_((OnigCalloutFunc f));
992 ONIG_EXTERN
993 int onig_set_callout_of_name P_((OnigEncoding enc, OnigCalloutType type, OnigUChar* name, OnigUChar* name_end, int callout_in, OnigCalloutFunc callout, OnigCalloutFunc end_callout, int arg_num, unsigned int arg_types[], int optional_arg_num, OnigValue opt_defaults[]));
994 ONIG_EXTERN
995 OnigUChar* onig_get_callout_name_by_name_id P_((int id));
996 ONIG_EXTERN
997 int onig_get_callout_num_by_tag P_((OnigRegex reg, const OnigUChar* tag, const OnigUChar* tag_end));
998 ONIG_EXTERN
999 int onig_get_callout_data_by_tag P_((OnigRegex reg, OnigMatchParam* mp, const OnigUChar* tag, const OnigUChar* tag_end, int slot, OnigType* type, OnigValue* val));
1000 ONIG_EXTERN
1001 int onig_set_callout_data_by_tag P_((OnigRegex reg, OnigMatchParam* mp, const OnigUChar* tag, const OnigUChar* tag_end, int slot, OnigType type, OnigValue* val));
1002 ONIG_EXTERN
1003 int onig_get_callout_data_by_tag_dont_clear_old P_((regex_t* reg, OnigMatchParam* mp, const UChar* tag, const UChar* tag_end, int slot, OnigType* type, OnigValue* val));
1004 
1005 /* used in callout functions */
1006 ONIG_EXTERN
1007 int onig_get_callout_num_by_callout_args P_((OnigCalloutArgs* args));
1008 ONIG_EXTERN
1009 OnigCalloutIn onig_get_callout_in_by_callout_args P_((OnigCalloutArgs* args));
1010 ONIG_EXTERN
1011 int onig_get_name_id_by_callout_args P_((OnigCalloutArgs* args));
1012 ONIG_EXTERN
1013 const OnigUChar* onig_get_contents_by_callout_args P_((OnigCalloutArgs* args));
1014 ONIG_EXTERN
1015 const OnigUChar* onig_get_contents_end_by_callout_args P_((OnigCalloutArgs* args));
1016 ONIG_EXTERN
1017 int onig_get_args_num_by_callout_args P_((OnigCalloutArgs* args));
1018 ONIG_EXTERN
1019 int onig_get_passed_args_num_by_callout_args P_((OnigCalloutArgs* args));
1020 ONIG_EXTERN
1021 int onig_get_arg_by_callout_args P_((OnigCalloutArgs* args, int index, OnigType* type, OnigValue* val));
1022 ONIG_EXTERN
1023 const OnigUChar* onig_get_string_by_callout_args P_((OnigCalloutArgs* args));
1024 ONIG_EXTERN
1025 const OnigUChar* onig_get_string_end_by_callout_args P_((OnigCalloutArgs* args));
1026 ONIG_EXTERN
1027 const OnigUChar* onig_get_start_by_callout_args P_((OnigCalloutArgs* args));
1028 ONIG_EXTERN
1029 const OnigUChar* onig_get_right_range_by_callout_args P_((OnigCalloutArgs* args));
1030 ONIG_EXTERN
1031 const OnigUChar* onig_get_current_by_callout_args P_((OnigCalloutArgs* args));
1032 ONIG_EXTERN
1033 OnigRegex onig_get_regex_by_callout_args P_((OnigCalloutArgs* args));
1034 ONIG_EXTERN
1035 unsigned long onig_get_retry_counter_by_callout_args P_((OnigCalloutArgs* args));
1036 ONIG_EXTERN
1037 int onig_callout_tag_is_exist_at_callout_num P_((OnigRegex reg, int callout_num));
1038 ONIG_EXTERN
1039 const OnigUChar* onig_get_callout_tag_start P_((OnigRegex reg, int callout_num));
1040 ONIG_EXTERN
1041 const OnigUChar* onig_get_callout_tag_end P_((OnigRegex reg, int callout_num));
1042 ONIG_EXTERN
1043 int onig_get_callout_data_dont_clear_old P_((OnigRegex reg, OnigMatchParam* mp, int callout_num, int slot, OnigType* type, OnigValue* val));
1044 ONIG_EXTERN
1045 int onig_get_callout_data_by_callout_args_self_dont_clear_old P_((OnigCalloutArgs* args, int slot, OnigType* type, OnigValue* val));
1046 ONIG_EXTERN
1047 int onig_get_callout_data P_((OnigRegex reg, OnigMatchParam* mp, int callout_num, int slot, OnigType* type, OnigValue* val));
1048 ONIG_EXTERN
1049 int onig_get_callout_data_by_callout_args P_((OnigCalloutArgs* args, int callout_num, int slot, OnigType* type, OnigValue* val));
1050 ONIG_EXTERN
1051 int onig_get_callout_data_by_callout_args_self P_((OnigCalloutArgs* args, int slot, OnigType* type, OnigValue* val));
1052 ONIG_EXTERN
1053 int onig_set_callout_data P_((OnigRegex reg, OnigMatchParam* mp, int callout_num, int slot, OnigType type, OnigValue* val));
1054 ONIG_EXTERN
1055 int onig_set_callout_data_by_callout_args P_((OnigCalloutArgs* args, int callout_num, int slot, OnigType type, OnigValue* val));
1056 ONIG_EXTERN
1057 int onig_set_callout_data_by_callout_args_self P_((OnigCalloutArgs* args, int slot, OnigType type, OnigValue* val));
1058 ONIG_EXTERN
1059 int onig_get_capture_range_in_callout P_((OnigCalloutArgs* args, int mem_num, int* begin, int* end));
1060 ONIG_EXTERN
1061 int onig_get_used_stack_size_in_callout P_((OnigCalloutArgs* args, int* used_num, int* used_bytes));
1062 
1063 /* builtin callout functions */
1064 ONIG_EXTERN
1065 int onig_builtin_fail P_((OnigCalloutArgs* args, void* user_data));
1066 ONIG_EXTERN
1067 int onig_builtin_mismatch P_((OnigCalloutArgs* args, void* user_data));
1068 ONIG_EXTERN
1069 int onig_builtin_error P_((OnigCalloutArgs* args, void* user_data));
1070 ONIG_EXTERN
1071 int onig_builtin_count P_((OnigCalloutArgs* args, void* user_data));
1072 ONIG_EXTERN
1073 int onig_builtin_total_count P_((OnigCalloutArgs* args, void* user_data));
1074 ONIG_EXTERN
1075 int onig_builtin_max P_((OnigCalloutArgs* args, void* user_data));
1076 ONIG_EXTERN
1077 int onig_builtin_cmp P_((OnigCalloutArgs* args, void* user_data));
1078 
1079 ONIG_EXTERN
1080 int onig_setup_builtin_monitors_by_ascii_encoded_name P_((void* fp));
1081 
1082 #ifdef __cplusplus
1083 }
1084 #endif
1085 
1086 #endif /* ONIGURUMA_H */
1087