1 #ifndef ONIGURUMA_H 2 #define ONIGURUMA_H 3 /********************************************************************** 4 oniguruma.h - Oniguruma (regular expression library) 5 **********************************************************************/ 6 /*- 7 * Copyright (c) 2002-2018 K.Kosako <sndgk393 AT ybb DOT ne DOT jp> 8 * All rights reserved. 9 * 10 * Redistribution and use in source and binary forms, with or without 11 * modification, are permitted provided that the following conditions 12 * are met: 13 * 1. Redistributions of source code must retain the above copyright 14 * notice, this list of conditions and the following disclaimer. 15 * 2. Redistributions in binary form must reproduce the above copyright 16 * notice, this list of conditions and the following disclaimer in the 17 * documentation and/or other materials provided with the distribution. 18 * 19 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 20 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 23 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29 * SUCH DAMAGE. 30 */ 31 32 #ifdef __cplusplus 33 extern "C" { 34 #endif 35 36 #define ONIGURUMA 37 #define ONIGURUMA_VERSION_MAJOR 6 38 #define ONIGURUMA_VERSION_MINOR 9 39 #define ONIGURUMA_VERSION_TEENY 1 40 41 #define ONIGURUMA_VERSION_INT 60901 42 43 #ifndef P_ 44 #if defined(__STDC__) || defined(_WIN32) 45 # define P_(args) args 46 #else 47 # define P_(args) () 48 #endif 49 #endif 50 51 #ifndef PV_ 52 # define PV_(args) args 53 #endif 54 55 #ifndef ONIG_EXTERN 56 #if defined(_WIN32) && !defined(__GNUC__) 57 #if defined(ONIGURUMA_EXPORT) 58 #define ONIG_EXTERN extern __declspec(dllexport) 59 #else 60 #define ONIG_EXTERN extern __declspec(dllimport) 61 #endif 62 #endif 63 #endif 64 65 #ifndef ONIG_EXTERN 66 #define ONIG_EXTERN extern 67 #endif 68 69 /* PART: character encoding */ 70 71 #ifndef ONIG_ESCAPE_UCHAR_COLLISION 72 #define UChar OnigUChar 73 #endif 74 75 typedef unsigned int OnigCodePoint; 76 typedef unsigned char OnigUChar; 77 typedef unsigned int OnigCtype; 78 typedef unsigned int OnigLen; 79 80 #define ONIG_INFINITE_DISTANCE ~((OnigLen )0) 81 82 typedef unsigned int OnigCaseFoldType; /* case fold flag */ 83 84 ONIG_EXTERN OnigCaseFoldType OnigDefaultCaseFoldFlag; 85 86 /* #define ONIGENC_CASE_FOLD_HIRAGANA_KATAKANA (1<<1) */ 87 /* #define ONIGENC_CASE_FOLD_KATAKANA_WIDTH (1<<2) */ 88 #define ONIGENC_CASE_FOLD_TURKISH_AZERI (1<<20) 89 #define INTERNAL_ONIGENC_CASE_FOLD_MULTI_CHAR (1<<30) 90 91 #define ONIGENC_CASE_FOLD_MIN INTERNAL_ONIGENC_CASE_FOLD_MULTI_CHAR 92 #define ONIGENC_CASE_FOLD_DEFAULT OnigDefaultCaseFoldFlag 93 94 95 #define ONIGENC_MAX_COMP_CASE_FOLD_CODE_LEN 3 96 #define ONIGENC_GET_CASE_FOLD_CODES_MAX_NUM 13 97 /* 13 => Unicode:0x1ffc */ 98 99 /* code range */ 100 #define ONIGENC_CODE_RANGE_NUM(range) ((int )range[0]) 101 #define ONIGENC_CODE_RANGE_FROM(range,i) range[((i)*2) + 1] 102 #define ONIGENC_CODE_RANGE_TO(range,i) range[((i)*2) + 2] 103 104 typedef struct { 105 int byte_len; /* argument(original) character(s) byte length */ 106 int code_len; /* number of code */ 107 OnigCodePoint code[ONIGENC_MAX_COMP_CASE_FOLD_CODE_LEN]; 108 } OnigCaseFoldCodeItem; 109 110 typedef struct { 111 OnigCodePoint esc; 112 OnigCodePoint anychar; 113 OnigCodePoint anytime; 114 OnigCodePoint zero_or_one_time; 115 OnigCodePoint one_or_more_time; 116 OnigCodePoint anychar_anytime; 117 } OnigMetaCharTableType; 118 119 typedef int (*OnigApplyAllCaseFoldFunc)(OnigCodePoint from, OnigCodePoint* to, int to_len, void* arg); 120 121 typedef struct OnigEncodingTypeST { 122 int (*mbc_enc_len)(const OnigUChar* p); 123 const char* name; 124 int max_enc_len; 125 int min_enc_len; 126 int (*is_mbc_newline)(const OnigUChar* p, const OnigUChar* end); 127 OnigCodePoint (*mbc_to_code)(const OnigUChar* p, const OnigUChar* end); 128 int (*code_to_mbclen)(OnigCodePoint code); 129 int (*code_to_mbc)(OnigCodePoint code, OnigUChar *buf); 130 int (*mbc_case_fold)(OnigCaseFoldType flag, const OnigUChar** pp, const OnigUChar* end, OnigUChar* to); 131 int (*apply_all_case_fold)(OnigCaseFoldType flag, OnigApplyAllCaseFoldFunc f, void* arg); 132 int (*get_case_fold_codes_by_str)(OnigCaseFoldType flag, const OnigUChar* p, const OnigUChar* end, OnigCaseFoldCodeItem acs[]); 133 int (*property_name_to_ctype)(struct OnigEncodingTypeST* enc, OnigUChar* p, OnigUChar* end); 134 int (*is_code_ctype)(OnigCodePoint code, OnigCtype ctype); 135 int (*get_ctype_code_range)(OnigCtype ctype, OnigCodePoint* sb_out, const OnigCodePoint* ranges[]); 136 OnigUChar* (*left_adjust_char_head)(const OnigUChar* start, const OnigUChar* p); 137 int (*is_allowed_reverse_match)(const OnigUChar* p, const OnigUChar* end); 138 int (*init)(void); 139 int (*is_initialized)(void); 140 int (*is_valid_mbc_string)(const OnigUChar* s, const OnigUChar* end); 141 unsigned int flag; 142 OnigCodePoint sb_range; 143 int index; 144 } OnigEncodingType; 145 146 typedef OnigEncodingType* OnigEncoding; 147 148 ONIG_EXTERN OnigEncodingType OnigEncodingASCII; 149 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_1; 150 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_2; 151 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_3; 152 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_4; 153 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_5; 154 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_6; 155 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_7; 156 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_8; 157 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_9; 158 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_10; 159 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_11; 160 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_13; 161 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_14; 162 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_15; 163 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_16; 164 ONIG_EXTERN OnigEncodingType OnigEncodingUTF8; 165 ONIG_EXTERN OnigEncodingType OnigEncodingUTF16_BE; 166 ONIG_EXTERN OnigEncodingType OnigEncodingUTF16_LE; 167 ONIG_EXTERN OnigEncodingType OnigEncodingUTF32_BE; 168 ONIG_EXTERN OnigEncodingType OnigEncodingUTF32_LE; 169 ONIG_EXTERN OnigEncodingType OnigEncodingEUC_JP; 170 ONIG_EXTERN OnigEncodingType OnigEncodingEUC_TW; 171 ONIG_EXTERN OnigEncodingType OnigEncodingEUC_KR; 172 ONIG_EXTERN OnigEncodingType OnigEncodingEUC_CN; 173 ONIG_EXTERN OnigEncodingType OnigEncodingSJIS; 174 ONIG_EXTERN OnigEncodingType OnigEncodingKOI8; 175 ONIG_EXTERN OnigEncodingType OnigEncodingKOI8_R; 176 ONIG_EXTERN OnigEncodingType OnigEncodingCP1251; 177 ONIG_EXTERN OnigEncodingType OnigEncodingBIG5; 178 ONIG_EXTERN OnigEncodingType OnigEncodingGB18030; 179 180 #define ONIG_ENCODING_ASCII (&OnigEncodingASCII) 181 #define ONIG_ENCODING_ISO_8859_1 (&OnigEncodingISO_8859_1) 182 #define ONIG_ENCODING_ISO_8859_2 (&OnigEncodingISO_8859_2) 183 #define ONIG_ENCODING_ISO_8859_3 (&OnigEncodingISO_8859_3) 184 #define ONIG_ENCODING_ISO_8859_4 (&OnigEncodingISO_8859_4) 185 #define ONIG_ENCODING_ISO_8859_5 (&OnigEncodingISO_8859_5) 186 #define ONIG_ENCODING_ISO_8859_6 (&OnigEncodingISO_8859_6) 187 #define ONIG_ENCODING_ISO_8859_7 (&OnigEncodingISO_8859_7) 188 #define ONIG_ENCODING_ISO_8859_8 (&OnigEncodingISO_8859_8) 189 #define ONIG_ENCODING_ISO_8859_9 (&OnigEncodingISO_8859_9) 190 #define ONIG_ENCODING_ISO_8859_10 (&OnigEncodingISO_8859_10) 191 #define ONIG_ENCODING_ISO_8859_11 (&OnigEncodingISO_8859_11) 192 #define ONIG_ENCODING_ISO_8859_13 (&OnigEncodingISO_8859_13) 193 #define ONIG_ENCODING_ISO_8859_14 (&OnigEncodingISO_8859_14) 194 #define ONIG_ENCODING_ISO_8859_15 (&OnigEncodingISO_8859_15) 195 #define ONIG_ENCODING_ISO_8859_16 (&OnigEncodingISO_8859_16) 196 #define ONIG_ENCODING_UTF8 (&OnigEncodingUTF8) 197 #define ONIG_ENCODING_UTF16_BE (&OnigEncodingUTF16_BE) 198 #define ONIG_ENCODING_UTF16_LE (&OnigEncodingUTF16_LE) 199 #define ONIG_ENCODING_UTF32_BE (&OnigEncodingUTF32_BE) 200 #define ONIG_ENCODING_UTF32_LE (&OnigEncodingUTF32_LE) 201 #define ONIG_ENCODING_EUC_JP (&OnigEncodingEUC_JP) 202 #define ONIG_ENCODING_EUC_TW (&OnigEncodingEUC_TW) 203 #define ONIG_ENCODING_EUC_KR (&OnigEncodingEUC_KR) 204 #define ONIG_ENCODING_EUC_CN (&OnigEncodingEUC_CN) 205 #define ONIG_ENCODING_SJIS (&OnigEncodingSJIS) 206 #define ONIG_ENCODING_KOI8 (&OnigEncodingKOI8) 207 #define ONIG_ENCODING_KOI8_R (&OnigEncodingKOI8_R) 208 #define ONIG_ENCODING_CP1251 (&OnigEncodingCP1251) 209 #define ONIG_ENCODING_BIG5 (&OnigEncodingBIG5) 210 #define ONIG_ENCODING_GB18030 (&OnigEncodingGB18030) 211 212 #define ONIG_ENCODING_UNDEF ((OnigEncoding )0) 213 214 215 /* work size */ 216 #define ONIGENC_CODE_TO_MBC_MAXLEN 7 217 #define ONIGENC_MBC_CASE_FOLD_MAXLEN 18 218 /* 18: 6(max-byte) * 3(case-fold chars) */ 219 220 /* character types */ 221 typedef enum { 222 ONIGENC_CTYPE_NEWLINE = 0, 223 ONIGENC_CTYPE_ALPHA = 1, 224 ONIGENC_CTYPE_BLANK = 2, 225 ONIGENC_CTYPE_CNTRL = 3, 226 ONIGENC_CTYPE_DIGIT = 4, 227 ONIGENC_CTYPE_GRAPH = 5, 228 ONIGENC_CTYPE_LOWER = 6, 229 ONIGENC_CTYPE_PRINT = 7, 230 ONIGENC_CTYPE_PUNCT = 8, 231 ONIGENC_CTYPE_SPACE = 9, 232 ONIGENC_CTYPE_UPPER = 10, 233 ONIGENC_CTYPE_XDIGIT = 11, 234 ONIGENC_CTYPE_WORD = 12, 235 ONIGENC_CTYPE_ALNUM = 13, /* alpha || digit */ 236 ONIGENC_CTYPE_ASCII = 14 237 } OnigEncCtype; 238 239 #define ONIGENC_MAX_STD_CTYPE ONIGENC_CTYPE_ASCII 240 241 242 #define onig_enc_len(enc,p,end) ONIGENC_MBC_ENC_LEN(enc,p) 243 244 #define ONIGENC_IS_UNDEF(enc) ((enc) == ONIG_ENCODING_UNDEF) 245 #define ONIGENC_IS_SINGLEBYTE(enc) (ONIGENC_MBC_MAXLEN(enc) == 1) 246 #define ONIGENC_IS_MBC_HEAD(enc,p) (ONIGENC_MBC_ENC_LEN(enc,p) != 1) 247 #define ONIGENC_IS_MBC_ASCII(p) (*(p) < 128) 248 #define ONIGENC_IS_CODE_ASCII(code) ((code) < 128) 249 #define ONIGENC_IS_MBC_WORD(enc,s,end) \ 250 ONIGENC_IS_CODE_WORD(enc,ONIGENC_MBC_TO_CODE(enc,s,end)) 251 #define ONIGENC_IS_MBC_WORD_ASCII(enc,s,end) onigenc_is_mbc_word_ascii(enc,s,end) 252 253 #define ONIGENC_NAME(enc) ((enc)->name) 254 255 #define ONIGENC_MBC_CASE_FOLD(enc,flag,pp,end,buf) \ 256 (enc)->mbc_case_fold(flag,(const OnigUChar** )pp,end,buf) 257 #define ONIGENC_IS_ALLOWED_REVERSE_MATCH(enc,s,end) \ 258 (enc)->is_allowed_reverse_match(s,end) 259 #define ONIGENC_LEFT_ADJUST_CHAR_HEAD(enc,start,s) \ 260 (enc)->left_adjust_char_head(start, s) 261 #define ONIGENC_IS_VALID_MBC_STRING(enc,s,end) \ 262 (enc)->is_valid_mbc_string(s,end) 263 #define ONIGENC_APPLY_ALL_CASE_FOLD(enc,case_fold_flag,f,arg) \ 264 (enc)->apply_all_case_fold(case_fold_flag,f,arg) 265 #define ONIGENC_GET_CASE_FOLD_CODES_BY_STR(enc,case_fold_flag,p,end,acs) \ 266 (enc)->get_case_fold_codes_by_str(case_fold_flag,p,end,acs) 267 #define ONIGENC_STEP_BACK(enc,start,s,n) \ 268 onigenc_step_back((enc),(start),(s),(n)) 269 270 #define ONIGENC_MBC_ENC_LEN(enc,p) (enc)->mbc_enc_len(p) 271 #define ONIGENC_MBC_MAXLEN(enc) ((enc)->max_enc_len) 272 #define ONIGENC_MBC_MAXLEN_DIST(enc) ONIGENC_MBC_MAXLEN(enc) 273 #define ONIGENC_MBC_MINLEN(enc) ((enc)->min_enc_len) 274 #define ONIGENC_IS_MBC_NEWLINE(enc,p,end) (enc)->is_mbc_newline((p),(end)) 275 #define ONIGENC_MBC_TO_CODE(enc,p,end) (enc)->mbc_to_code((p),(end)) 276 #define ONIGENC_CODE_TO_MBCLEN(enc,code) (enc)->code_to_mbclen(code) 277 #define ONIGENC_CODE_TO_MBC(enc,code,buf) (enc)->code_to_mbc(code,buf) 278 #define ONIGENC_PROPERTY_NAME_TO_CTYPE(enc,p,end) \ 279 (enc)->property_name_to_ctype(enc,p,end) 280 281 #define ONIGENC_IS_CODE_CTYPE(enc,code,ctype) (enc)->is_code_ctype(code,ctype) 282 283 #define ONIGENC_IS_CODE_NEWLINE(enc,code) \ 284 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_NEWLINE) 285 #define ONIGENC_IS_CODE_GRAPH(enc,code) \ 286 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_GRAPH) 287 #define ONIGENC_IS_CODE_PRINT(enc,code) \ 288 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_PRINT) 289 #define ONIGENC_IS_CODE_ALNUM(enc,code) \ 290 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_ALNUM) 291 #define ONIGENC_IS_CODE_ALPHA(enc,code) \ 292 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_ALPHA) 293 #define ONIGENC_IS_CODE_LOWER(enc,code) \ 294 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_LOWER) 295 #define ONIGENC_IS_CODE_UPPER(enc,code) \ 296 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_UPPER) 297 #define ONIGENC_IS_CODE_CNTRL(enc,code) \ 298 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_CNTRL) 299 #define ONIGENC_IS_CODE_PUNCT(enc,code) \ 300 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_PUNCT) 301 #define ONIGENC_IS_CODE_SPACE(enc,code) \ 302 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_SPACE) 303 #define ONIGENC_IS_CODE_BLANK(enc,code) \ 304 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_BLANK) 305 #define ONIGENC_IS_CODE_DIGIT(enc,code) \ 306 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_DIGIT) 307 #define ONIGENC_IS_CODE_XDIGIT(enc,code) \ 308 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_XDIGIT) 309 #define ONIGENC_IS_CODE_WORD(enc,code) \ 310 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_WORD) 311 312 #define ONIGENC_GET_CTYPE_CODE_RANGE(enc,ctype,sbout,ranges) \ 313 (enc)->get_ctype_code_range(ctype,sbout,ranges) 314 315 ONIG_EXTERN 316 OnigUChar* onigenc_step_back P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s, int n)); 317 318 319 /* encoding API */ 320 ONIG_EXTERN 321 int onigenc_init P_((void)); 322 ONIG_EXTERN 323 int onig_initialize_encoding P_((OnigEncoding enc)); 324 ONIG_EXTERN 325 int onigenc_set_default_encoding P_((OnigEncoding enc)); 326 ONIG_EXTERN 327 OnigEncoding onigenc_get_default_encoding P_((void)); 328 ONIG_EXTERN 329 void onigenc_set_default_caseconv_table P_((const OnigUChar* table)); 330 ONIG_EXTERN 331 OnigUChar* onigenc_get_right_adjust_char_head_with_prev P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s, const OnigUChar** prev)); 332 ONIG_EXTERN 333 OnigUChar* onigenc_get_prev_char_head P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s)); 334 ONIG_EXTERN 335 OnigUChar* onigenc_get_left_adjust_char_head P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s)); 336 ONIG_EXTERN 337 OnigUChar* onigenc_get_right_adjust_char_head P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s)); 338 ONIG_EXTERN 339 int onigenc_strlen P_((OnigEncoding enc, const OnigUChar* p, const OnigUChar* end)); 340 ONIG_EXTERN 341 int onigenc_strlen_null P_((OnigEncoding enc, const OnigUChar* p)); 342 ONIG_EXTERN 343 int onigenc_str_bytelen_null P_((OnigEncoding enc, const OnigUChar* p)); 344 ONIG_EXTERN 345 int onigenc_is_valid_mbc_string P_((OnigEncoding enc, const OnigUChar* s, const OnigUChar* end)); 346 ONIG_EXTERN 347 OnigUChar* onigenc_strdup P_((OnigEncoding enc, const OnigUChar* s, const OnigUChar* end)); 348 349 350 /* PART: regular expression */ 351 352 /* config parameters */ 353 #define ONIG_NREGION 10 354 #define ONIG_MAX_CAPTURE_NUM 2147483647 /* 2**31 - 1 */ 355 #define ONIG_MAX_BACKREF_NUM 1000 356 #define ONIG_MAX_REPEAT_NUM 100000 357 #define ONIG_MAX_MULTI_BYTE_RANGES_NUM 10000 358 /* constants */ 359 #define ONIG_MAX_ERROR_MESSAGE_LEN 90 360 361 typedef unsigned int OnigOptionType; 362 363 #define ONIG_OPTION_DEFAULT ONIG_OPTION_NONE 364 365 /* options */ 366 #define ONIG_OPTION_NONE 0U 367 /* options (compile time) */ 368 #define ONIG_OPTION_IGNORECASE 1U 369 #define ONIG_OPTION_EXTEND (ONIG_OPTION_IGNORECASE << 1) 370 #define ONIG_OPTION_MULTILINE (ONIG_OPTION_EXTEND << 1) 371 #define ONIG_OPTION_SINGLELINE (ONIG_OPTION_MULTILINE << 1) 372 #define ONIG_OPTION_FIND_LONGEST (ONIG_OPTION_SINGLELINE << 1) 373 #define ONIG_OPTION_FIND_NOT_EMPTY (ONIG_OPTION_FIND_LONGEST << 1) 374 #define ONIG_OPTION_NEGATE_SINGLELINE (ONIG_OPTION_FIND_NOT_EMPTY << 1) 375 #define ONIG_OPTION_DONT_CAPTURE_GROUP (ONIG_OPTION_NEGATE_SINGLELINE << 1) 376 #define ONIG_OPTION_CAPTURE_GROUP (ONIG_OPTION_DONT_CAPTURE_GROUP << 1) 377 /* options (search time) */ 378 #define ONIG_OPTION_NOTBOL (ONIG_OPTION_CAPTURE_GROUP << 1) 379 #define ONIG_OPTION_NOTEOL (ONIG_OPTION_NOTBOL << 1) 380 #define ONIG_OPTION_POSIX_REGION (ONIG_OPTION_NOTEOL << 1) 381 #define ONIG_OPTION_CHECK_VALIDITY_OF_STRING (ONIG_OPTION_POSIX_REGION << 1) 382 /* #define ONIG_OPTION_CRLF_AS_LINE_SEPARATOR (ONIG_OPTION_CHECK_VALIDITY_OF_STRING << 1) */ 383 /* options (compile time) */ 384 #define ONIG_OPTION_WORD_IS_ASCII (ONIG_OPTION_CHECK_VALIDITY_OF_STRING << 4) 385 #define ONIG_OPTION_DIGIT_IS_ASCII (ONIG_OPTION_WORD_IS_ASCII << 1) 386 #define ONIG_OPTION_SPACE_IS_ASCII (ONIG_OPTION_DIGIT_IS_ASCII << 1) 387 #define ONIG_OPTION_POSIX_IS_ASCII (ONIG_OPTION_SPACE_IS_ASCII << 1) 388 389 #define ONIG_OPTION_MAXBIT ONIG_OPTION_POSIX_IS_ASCII /* limit */ 390 391 #define ONIG_OPTION_ON(options,regopt) ((options) |= (regopt)) 392 #define ONIG_OPTION_OFF(options,regopt) ((options) &= ~(regopt)) 393 #define ONIG_IS_OPTION_ON(options,option) ((options) & (option)) 394 395 /* syntax */ 396 typedef struct { 397 unsigned int op; 398 unsigned int op2; 399 unsigned int behavior; 400 OnigOptionType options; /* default option */ 401 OnigMetaCharTableType meta_char_table; 402 } OnigSyntaxType; 403 404 ONIG_EXTERN OnigSyntaxType OnigSyntaxASIS; 405 ONIG_EXTERN OnigSyntaxType OnigSyntaxPosixBasic; 406 ONIG_EXTERN OnigSyntaxType OnigSyntaxPosixExtended; 407 ONIG_EXTERN OnigSyntaxType OnigSyntaxEmacs; 408 ONIG_EXTERN OnigSyntaxType OnigSyntaxGrep; 409 ONIG_EXTERN OnigSyntaxType OnigSyntaxGnuRegex; 410 ONIG_EXTERN OnigSyntaxType OnigSyntaxJava; 411 ONIG_EXTERN OnigSyntaxType OnigSyntaxPerl; 412 ONIG_EXTERN OnigSyntaxType OnigSyntaxPerl_NG; 413 ONIG_EXTERN OnigSyntaxType OnigSyntaxRuby; 414 ONIG_EXTERN OnigSyntaxType OnigSyntaxOniguruma; 415 416 /* predefined syntaxes (see regsyntax.c) */ 417 #define ONIG_SYNTAX_ASIS (&OnigSyntaxASIS) 418 #define ONIG_SYNTAX_POSIX_BASIC (&OnigSyntaxPosixBasic) 419 #define ONIG_SYNTAX_POSIX_EXTENDED (&OnigSyntaxPosixExtended) 420 #define ONIG_SYNTAX_EMACS (&OnigSyntaxEmacs) 421 #define ONIG_SYNTAX_GREP (&OnigSyntaxGrep) 422 #define ONIG_SYNTAX_GNU_REGEX (&OnigSyntaxGnuRegex) 423 #define ONIG_SYNTAX_JAVA (&OnigSyntaxJava) 424 #define ONIG_SYNTAX_PERL (&OnigSyntaxPerl) 425 #define ONIG_SYNTAX_PERL_NG (&OnigSyntaxPerl_NG) 426 #define ONIG_SYNTAX_RUBY (&OnigSyntaxRuby) 427 #define ONIG_SYNTAX_ONIGURUMA (&OnigSyntaxOniguruma) 428 429 /* default syntax */ 430 ONIG_EXTERN OnigSyntaxType* OnigDefaultSyntax; 431 #define ONIG_SYNTAX_DEFAULT OnigDefaultSyntax 432 433 /* syntax (operators) */ 434 #define ONIG_SYN_OP_VARIABLE_META_CHARACTERS (1U<<0) 435 #define ONIG_SYN_OP_DOT_ANYCHAR (1U<<1) /* . */ 436 #define ONIG_SYN_OP_ASTERISK_ZERO_INF (1U<<2) /* * */ 437 #define ONIG_SYN_OP_ESC_ASTERISK_ZERO_INF (1U<<3) 438 #define ONIG_SYN_OP_PLUS_ONE_INF (1U<<4) /* + */ 439 #define ONIG_SYN_OP_ESC_PLUS_ONE_INF (1U<<5) 440 #define ONIG_SYN_OP_QMARK_ZERO_ONE (1U<<6) /* ? */ 441 #define ONIG_SYN_OP_ESC_QMARK_ZERO_ONE (1U<<7) 442 #define ONIG_SYN_OP_BRACE_INTERVAL (1U<<8) /* {lower,upper} */ 443 #define ONIG_SYN_OP_ESC_BRACE_INTERVAL (1U<<9) /* \{lower,upper\} */ 444 #define ONIG_SYN_OP_VBAR_ALT (1U<<10) /* | */ 445 #define ONIG_SYN_OP_ESC_VBAR_ALT (1U<<11) /* \| */ 446 #define ONIG_SYN_OP_LPAREN_SUBEXP (1U<<12) /* (...) */ 447 #define ONIG_SYN_OP_ESC_LPAREN_SUBEXP (1U<<13) /* \(...\) */ 448 #define ONIG_SYN_OP_ESC_AZ_BUF_ANCHOR (1U<<14) /* \A, \Z, \z */ 449 #define ONIG_SYN_OP_ESC_CAPITAL_G_BEGIN_ANCHOR (1U<<15) /* \G */ 450 #define ONIG_SYN_OP_DECIMAL_BACKREF (1U<<16) /* \num */ 451 #define ONIG_SYN_OP_BRACKET_CC (1U<<17) /* [...] */ 452 #define ONIG_SYN_OP_ESC_W_WORD (1U<<18) /* \w, \W */ 453 #define ONIG_SYN_OP_ESC_LTGT_WORD_BEGIN_END (1U<<19) /* \<. \> */ 454 #define ONIG_SYN_OP_ESC_B_WORD_BOUND (1U<<20) /* \b, \B */ 455 #define ONIG_SYN_OP_ESC_S_WHITE_SPACE (1U<<21) /* \s, \S */ 456 #define ONIG_SYN_OP_ESC_D_DIGIT (1U<<22) /* \d, \D */ 457 #define ONIG_SYN_OP_LINE_ANCHOR (1U<<23) /* ^, $ */ 458 #define ONIG_SYN_OP_POSIX_BRACKET (1U<<24) /* [:xxxx:] */ 459 #define ONIG_SYN_OP_QMARK_NON_GREEDY (1U<<25) /* ??,*?,+?,{n,m}? */ 460 #define ONIG_SYN_OP_ESC_CONTROL_CHARS (1U<<26) /* \n,\r,\t,\a ... */ 461 #define ONIG_SYN_OP_ESC_C_CONTROL (1U<<27) /* \cx */ 462 #define ONIG_SYN_OP_ESC_OCTAL3 (1U<<28) /* \OOO */ 463 #define ONIG_SYN_OP_ESC_X_HEX2 (1U<<29) /* \xHH */ 464 #define ONIG_SYN_OP_ESC_X_BRACE_HEX8 (1U<<30) /* \x{7HHHHHHH} */ 465 #define ONIG_SYN_OP_ESC_O_BRACE_OCTAL (1U<<31) /* \o{1OOOOOOOOOO} */ 466 467 #define ONIG_SYN_OP2_ESC_CAPITAL_Q_QUOTE (1U<<0) /* \Q...\E */ 468 #define ONIG_SYN_OP2_QMARK_GROUP_EFFECT (1U<<1) /* (?...) */ 469 #define ONIG_SYN_OP2_OPTION_PERL (1U<<2) /* (?imsx),(?-imsx) */ 470 #define ONIG_SYN_OP2_OPTION_RUBY (1U<<3) /* (?imx), (?-imx) */ 471 #define ONIG_SYN_OP2_PLUS_POSSESSIVE_REPEAT (1U<<4) /* ?+,*+,++ */ 472 #define ONIG_SYN_OP2_PLUS_POSSESSIVE_INTERVAL (1U<<5) /* {n,m}+ */ 473 #define ONIG_SYN_OP2_CCLASS_SET_OP (1U<<6) /* [...&&..[..]..] */ 474 #define ONIG_SYN_OP2_QMARK_LT_NAMED_GROUP (1U<<7) /* (?<name>...) */ 475 #define ONIG_SYN_OP2_ESC_K_NAMED_BACKREF (1U<<8) /* \k<name> */ 476 #define ONIG_SYN_OP2_ESC_G_SUBEXP_CALL (1U<<9) /* \g<name>, \g<n> */ 477 #define ONIG_SYN_OP2_ATMARK_CAPTURE_HISTORY (1U<<10) /* (?@..),(?@<x>..) */ 478 #define ONIG_SYN_OP2_ESC_CAPITAL_C_BAR_CONTROL (1U<<11) /* \C-x */ 479 #define ONIG_SYN_OP2_ESC_CAPITAL_M_BAR_META (1U<<12) /* \M-x */ 480 #define ONIG_SYN_OP2_ESC_V_VTAB (1U<<13) /* \v as VTAB */ 481 #define ONIG_SYN_OP2_ESC_U_HEX4 (1U<<14) /* \uHHHH */ 482 #define ONIG_SYN_OP2_ESC_GNU_BUF_ANCHOR (1U<<15) /* \`, \' */ 483 #define ONIG_SYN_OP2_ESC_P_BRACE_CHAR_PROPERTY (1U<<16) /* \p{...}, \P{...} */ 484 #define ONIG_SYN_OP2_ESC_P_BRACE_CIRCUMFLEX_NOT (1U<<17) /* \p{^..}, \P{^..} */ 485 /* #define ONIG_SYN_OP2_CHAR_PROPERTY_PREFIX_IS (1U<<18) */ 486 #define ONIG_SYN_OP2_ESC_H_XDIGIT (1U<<19) /* \h, \H */ 487 #define ONIG_SYN_OP2_INEFFECTIVE_ESCAPE (1U<<20) /* \ */ 488 #define ONIG_SYN_OP2_QMARK_LPAREN_IF_ELSE (1U<<21) /* (?(n)) (?(...)...|...) */ 489 #define ONIG_SYN_OP2_ESC_CAPITAL_K_KEEP (1U<<22) /* \K */ 490 #define ONIG_SYN_OP2_ESC_CAPITAL_R_GENERAL_NEWLINE (1U<<23) /* \R \r\n else [\x0a-\x0d] */ 491 #define ONIG_SYN_OP2_ESC_CAPITAL_N_O_SUPER_DOT (1U<<24) /* \N (?-m:.), \O (?m:.) */ 492 #define ONIG_SYN_OP2_QMARK_TILDE_ABSENT_GROUP (1U<<25) /* (?~...) */ 493 #define ONIG_SYN_OP2_ESC_X_Y_GRAPHEME_CLUSTER (1U<<26) /* \X \y \Y */ 494 #define ONIG_SYN_OP2_QMARK_PERL_SUBEXP_CALL (1U<<27) /* (?R), (?&name)... */ 495 #define ONIG_SYN_OP2_QMARK_BRACE_CALLOUT_CONTENTS (1U<<28) /* (?{...}) (?{{...}}) */ 496 #define ONIG_SYN_OP2_ASTERISK_CALLOUT_NAME (1U<<29) /* (*name) (*name{a,..}) */ 497 498 /* syntax (behavior) */ 499 #define ONIG_SYN_CONTEXT_INDEP_ANCHORS (1U<<31) /* not implemented */ 500 #define ONIG_SYN_CONTEXT_INDEP_REPEAT_OPS (1U<<0) /* ?, *, +, {n,m} */ 501 #define ONIG_SYN_CONTEXT_INVALID_REPEAT_OPS (1U<<1) /* error or ignore */ 502 #define ONIG_SYN_ALLOW_UNMATCHED_CLOSE_SUBEXP (1U<<2) /* ...)... */ 503 #define ONIG_SYN_ALLOW_INVALID_INTERVAL (1U<<3) /* {??? */ 504 #define ONIG_SYN_ALLOW_INTERVAL_LOW_ABBREV (1U<<4) /* {,n} => {0,n} */ 505 #define ONIG_SYN_STRICT_CHECK_BACKREF (1U<<5) /* /(\1)/,/\1()/ ..*/ 506 #define ONIG_SYN_DIFFERENT_LEN_ALT_LOOK_BEHIND (1U<<6) /* (?<=a|bc) */ 507 #define ONIG_SYN_CAPTURE_ONLY_NAMED_GROUP (1U<<7) /* see doc/RE */ 508 #define ONIG_SYN_ALLOW_MULTIPLEX_DEFINITION_NAME (1U<<8) /* (?<x>)(?<x>) */ 509 #define ONIG_SYN_FIXED_INTERVAL_IS_GREEDY_ONLY (1U<<9) /* a{n}?=(?:a{n})? */ 510 511 /* syntax (behavior) in char class [...] */ 512 #define ONIG_SYN_NOT_NEWLINE_IN_NEGATIVE_CC (1U<<20) /* [^...] */ 513 #define ONIG_SYN_BACKSLASH_ESCAPE_IN_CC (1U<<21) /* [..\w..] etc.. */ 514 #define ONIG_SYN_ALLOW_EMPTY_RANGE_IN_CC (1U<<22) 515 #define ONIG_SYN_ALLOW_DOUBLE_RANGE_OP_IN_CC (1U<<23) /* [0-9-a]=[0-9\-a] */ 516 /* syntax (behavior) warning */ 517 #define ONIG_SYN_WARN_CC_OP_NOT_ESCAPED (1U<<24) /* [,-,] */ 518 #define ONIG_SYN_WARN_REDUNDANT_NESTED_REPEAT (1U<<25) /* (?:a*)+ */ 519 520 /* meta character specifiers (onig_set_meta_char()) */ 521 #define ONIG_META_CHAR_ESCAPE 0 522 #define ONIG_META_CHAR_ANYCHAR 1 523 #define ONIG_META_CHAR_ANYTIME 2 524 #define ONIG_META_CHAR_ZERO_OR_ONE_TIME 3 525 #define ONIG_META_CHAR_ONE_OR_MORE_TIME 4 526 #define ONIG_META_CHAR_ANYCHAR_ANYTIME 5 527 528 #define ONIG_INEFFECTIVE_META_CHAR 0 529 530 /* error codes */ 531 #define ONIG_IS_PATTERN_ERROR(ecode) ((ecode) <= -100 && (ecode) > -1000) 532 /* normal return */ 533 #define ONIG_NORMAL 0 534 #define ONIG_MISMATCH -1 535 #define ONIG_NO_SUPPORT_CONFIG -2 536 #define ONIG_ABORT -3 537 538 /* internal error */ 539 #define ONIGERR_MEMORY -5 540 #define ONIGERR_TYPE_BUG -6 541 #define ONIGERR_PARSER_BUG -11 542 #define ONIGERR_STACK_BUG -12 543 #define ONIGERR_UNDEFINED_BYTECODE -13 544 #define ONIGERR_UNEXPECTED_BYTECODE -14 545 #define ONIGERR_MATCH_STACK_LIMIT_OVER -15 546 #define ONIGERR_PARSE_DEPTH_LIMIT_OVER -16 547 #define ONIGERR_RETRY_LIMIT_IN_MATCH_OVER -17 548 #define ONIGERR_DEFAULT_ENCODING_IS_NOT_SETTED -21 549 #define ONIGERR_SPECIFIED_ENCODING_CANT_CONVERT_TO_WIDE_CHAR -22 550 #define ONIGERR_FAIL_TO_INITIALIZE -23 551 /* general error */ 552 #define ONIGERR_INVALID_ARGUMENT -30 553 /* syntax error */ 554 #define ONIGERR_END_PATTERN_AT_LEFT_BRACE -100 555 #define ONIGERR_END_PATTERN_AT_LEFT_BRACKET -101 556 #define ONIGERR_EMPTY_CHAR_CLASS -102 557 #define ONIGERR_PREMATURE_END_OF_CHAR_CLASS -103 558 #define ONIGERR_END_PATTERN_AT_ESCAPE -104 559 #define ONIGERR_END_PATTERN_AT_META -105 560 #define ONIGERR_END_PATTERN_AT_CONTROL -106 561 #define ONIGERR_META_CODE_SYNTAX -108 562 #define ONIGERR_CONTROL_CODE_SYNTAX -109 563 #define ONIGERR_CHAR_CLASS_VALUE_AT_END_OF_RANGE -110 564 #define ONIGERR_CHAR_CLASS_VALUE_AT_START_OF_RANGE -111 565 #define ONIGERR_UNMATCHED_RANGE_SPECIFIER_IN_CHAR_CLASS -112 566 #define ONIGERR_TARGET_OF_REPEAT_OPERATOR_NOT_SPECIFIED -113 567 #define ONIGERR_TARGET_OF_REPEAT_OPERATOR_INVALID -114 568 #define ONIGERR_NESTED_REPEAT_OPERATOR -115 569 #define ONIGERR_UNMATCHED_CLOSE_PARENTHESIS -116 570 #define ONIGERR_END_PATTERN_WITH_UNMATCHED_PARENTHESIS -117 571 #define ONIGERR_END_PATTERN_IN_GROUP -118 572 #define ONIGERR_UNDEFINED_GROUP_OPTION -119 573 #define ONIGERR_INVALID_POSIX_BRACKET_TYPE -121 574 #define ONIGERR_INVALID_LOOK_BEHIND_PATTERN -122 575 #define ONIGERR_INVALID_REPEAT_RANGE_PATTERN -123 576 /* values error (syntax error) */ 577 #define ONIGERR_TOO_BIG_NUMBER -200 578 #define ONIGERR_TOO_BIG_NUMBER_FOR_REPEAT_RANGE -201 579 #define ONIGERR_UPPER_SMALLER_THAN_LOWER_IN_REPEAT_RANGE -202 580 #define ONIGERR_EMPTY_RANGE_IN_CHAR_CLASS -203 581 #define ONIGERR_MISMATCH_CODE_LENGTH_IN_CLASS_RANGE -204 582 #define ONIGERR_TOO_MANY_MULTI_BYTE_RANGES -205 583 #define ONIGERR_TOO_SHORT_MULTI_BYTE_STRING -206 584 #define ONIGERR_TOO_BIG_BACKREF_NUMBER -207 585 #define ONIGERR_INVALID_BACKREF -208 586 #define ONIGERR_NUMBERED_BACKREF_OR_CALL_NOT_ALLOWED -209 587 #define ONIGERR_TOO_MANY_CAPTURES -210 588 #define ONIGERR_TOO_LONG_WIDE_CHAR_VALUE -212 589 #define ONIGERR_EMPTY_GROUP_NAME -214 590 #define ONIGERR_INVALID_GROUP_NAME -215 591 #define ONIGERR_INVALID_CHAR_IN_GROUP_NAME -216 592 #define ONIGERR_UNDEFINED_NAME_REFERENCE -217 593 #define ONIGERR_UNDEFINED_GROUP_REFERENCE -218 594 #define ONIGERR_MULTIPLEX_DEFINED_NAME -219 595 #define ONIGERR_MULTIPLEX_DEFINITION_NAME_CALL -220 596 #define ONIGERR_NEVER_ENDING_RECURSION -221 597 #define ONIGERR_GROUP_NUMBER_OVER_FOR_CAPTURE_HISTORY -222 598 #define ONIGERR_INVALID_CHAR_PROPERTY_NAME -223 599 #define ONIGERR_INVALID_IF_ELSE_SYNTAX -224 600 #define ONIGERR_INVALID_ABSENT_GROUP_PATTERN -225 601 #define ONIGERR_INVALID_ABSENT_GROUP_GENERATOR_PATTERN -226 602 #define ONIGERR_INVALID_CALLOUT_PATTERN -227 603 #define ONIGERR_INVALID_CALLOUT_NAME -228 604 #define ONIGERR_UNDEFINED_CALLOUT_NAME -229 605 #define ONIGERR_INVALID_CALLOUT_BODY -230 606 #define ONIGERR_INVALID_CALLOUT_TAG_NAME -231 607 #define ONIGERR_INVALID_CALLOUT_ARG -232 608 #define ONIGERR_INVALID_CODE_POINT_VALUE -400 609 #define ONIGERR_INVALID_WIDE_CHAR_VALUE -400 610 #define ONIGERR_TOO_BIG_WIDE_CHAR_VALUE -401 611 #define ONIGERR_NOT_SUPPORTED_ENCODING_COMBINATION -402 612 #define ONIGERR_INVALID_COMBINATION_OF_OPTIONS -403 613 #define ONIGERR_TOO_MANY_USER_DEFINED_OBJECTS -404 614 #define ONIGERR_TOO_LONG_PROPERTY_NAME -405 615 #define ONIGERR_LIBRARY_IS_NOT_INITIALIZED -500 616 617 /* errors related to thread */ 618 /* #define ONIGERR_OVER_THREAD_PASS_LIMIT_COUNT -1001 */ 619 620 621 /* must be smaller than MEM_STATUS_BITS_NUM (unsigned int * 8) */ 622 #define ONIG_MAX_CAPTURE_HISTORY_GROUP 31 623 #define ONIG_IS_CAPTURE_HISTORY_GROUP(r, i) \ 624 ((i) <= ONIG_MAX_CAPTURE_HISTORY_GROUP && (r)->list && (r)->list[i]) 625 626 typedef struct OnigCaptureTreeNodeStruct { 627 int group; /* group number */ 628 int beg; 629 int end; 630 int allocated; 631 int num_childs; 632 struct OnigCaptureTreeNodeStruct** childs; 633 } OnigCaptureTreeNode; 634 635 /* match result region type */ 636 struct re_registers { 637 int allocated; 638 int num_regs; 639 int* beg; 640 int* end; 641 /* extended */ 642 OnigCaptureTreeNode* history_root; /* capture history tree root */ 643 }; 644 645 /* capture tree traverse */ 646 #define ONIG_TRAVERSE_CALLBACK_AT_FIRST 1 647 #define ONIG_TRAVERSE_CALLBACK_AT_LAST 2 648 #define ONIG_TRAVERSE_CALLBACK_AT_BOTH \ 649 ( ONIG_TRAVERSE_CALLBACK_AT_FIRST | ONIG_TRAVERSE_CALLBACK_AT_LAST ) 650 651 652 #define ONIG_REGION_NOTPOS -1 653 654 typedef struct re_registers OnigRegion; 655 656 typedef struct { 657 OnigEncoding enc; 658 OnigUChar* par; 659 OnigUChar* par_end; 660 } OnigErrorInfo; 661 662 typedef struct { 663 int lower; 664 int upper; 665 } OnigRepeatRange; 666 667 typedef void (*OnigWarnFunc) P_((const char* s)); 668 extern void onig_null_warn P_((const char* s)); 669 #define ONIG_NULL_WARN onig_null_warn 670 671 #define ONIG_CHAR_TABLE_SIZE 256 672 673 struct re_pattern_buffer; 674 typedef struct re_pattern_buffer OnigRegexType; 675 typedef OnigRegexType* OnigRegex; 676 677 #ifndef ONIG_ESCAPE_REGEX_T_COLLISION 678 typedef OnigRegexType regex_t; 679 #endif 680 681 682 typedef struct { 683 int num_of_elements; 684 OnigEncoding pattern_enc; 685 OnigEncoding target_enc; 686 OnigSyntaxType* syntax; 687 OnigOptionType option; 688 OnigCaseFoldType case_fold_flag; 689 } OnigCompileInfo; 690 691 692 /* types for callout */ 693 typedef enum { 694 ONIG_CALLOUT_IN_PROGRESS = 1, /* 1<<0 */ 695 ONIG_CALLOUT_IN_RETRACTION = 2 /* 1<<1 */ 696 } OnigCalloutIn; 697 698 #define ONIG_CALLOUT_IN_BOTH (ONIG_CALLOUT_IN_PROGRESS | ONIG_CALLOUT_IN_RETRACTION) 699 700 typedef enum { 701 ONIG_CALLOUT_OF_CONTENTS = 0, 702 ONIG_CALLOUT_OF_NAME = 1 703 } OnigCalloutOf; 704 705 typedef enum { 706 ONIG_CALLOUT_TYPE_SINGLE = 0, 707 ONIG_CALLOUT_TYPE_START_CALL = 1, 708 ONIG_CALLOUT_TYPE_BOTH_CALL = 2, 709 ONIG_CALLOUT_TYPE_START_MARK_END_CALL = 3, 710 } OnigCalloutType; 711 712 713 #define ONIG_NON_NAME_ID -1 714 #define ONIG_NON_CALLOUT_NUM 0 715 716 #define ONIG_CALLOUT_MAX_ARGS_NUM 4 717 #define ONIG_CALLOUT_DATA_SLOT_NUM 5 718 719 struct OnigCalloutArgsStruct; 720 typedef struct OnigCalloutArgsStruct OnigCalloutArgs; 721 722 typedef int (*OnigCalloutFunc)(OnigCalloutArgs* args, void* user_data); 723 724 /* callout function return values (less than -1: error code) */ 725 typedef enum { 726 ONIG_CALLOUT_FAIL = 1, 727 ONIG_CALLOUT_SUCCESS = 0 728 } OnigCalloutResult; 729 730 typedef enum { 731 ONIG_TYPE_VOID = 0, 732 ONIG_TYPE_LONG = 1<<0, 733 ONIG_TYPE_CHAR = 1<<1, 734 ONIG_TYPE_STRING = 1<<2, 735 ONIG_TYPE_POINTER = 1<<3, 736 ONIG_TYPE_TAG = 1<<4, 737 } OnigType; 738 739 typedef union { 740 long l; 741 OnigCodePoint c; 742 struct { 743 OnigUChar* start; 744 OnigUChar* end; 745 } s; 746 void* p; 747 int tag; /* tag -> callout_num */ 748 } OnigValue; 749 750 751 struct OnigMatchParamStruct; 752 typedef struct OnigMatchParamStruct OnigMatchParam; 753 754 755 /* Oniguruma Native API */ 756 757 ONIG_EXTERN 758 int onig_initialize P_((OnigEncoding encodings[], int number_of_encodings)); 759 /* onig_init(): deprecated function. Use onig_initialize(). */ 760 ONIG_EXTERN 761 int onig_init P_((void)); 762 ONIG_EXTERN 763 int onig_error_code_to_str PV_((OnigUChar* s, int err_code, ...)); 764 ONIG_EXTERN 765 void onig_set_warn_func P_((OnigWarnFunc f)); 766 ONIG_EXTERN 767 void onig_set_verb_warn_func P_((OnigWarnFunc f)); 768 ONIG_EXTERN 769 int onig_new P_((OnigRegex*, const OnigUChar* pattern, const OnigUChar* pattern_end, OnigOptionType option, OnigEncoding enc, OnigSyntaxType* syntax, OnigErrorInfo* einfo)); 770 ONIG_EXTERN 771 int onig_reg_init P_((OnigRegex reg, OnigOptionType option, OnigCaseFoldType case_fold_flag, OnigEncoding enc, OnigSyntaxType* syntax)); 772 int onig_new_without_alloc P_((OnigRegex, const OnigUChar* pattern, const OnigUChar* pattern_end, OnigOptionType option, OnigEncoding enc, OnigSyntaxType* syntax, OnigErrorInfo* einfo)); 773 ONIG_EXTERN 774 int onig_new_deluxe P_((OnigRegex* reg, const OnigUChar* pattern, const OnigUChar* pattern_end, OnigCompileInfo* ci, OnigErrorInfo* einfo)); 775 ONIG_EXTERN 776 void onig_free P_((OnigRegex)); 777 ONIG_EXTERN 778 void onig_free_body P_((OnigRegex)); 779 ONIG_EXTERN 780 int onig_scan(OnigRegex reg, const OnigUChar* str, const OnigUChar* end, OnigRegion* region, OnigOptionType option, int (*scan_callback)(int, int, OnigRegion*, void*), void* callback_arg); 781 ONIG_EXTERN 782 int onig_search P_((OnigRegex, const OnigUChar* str, const OnigUChar* end, const OnigUChar* start, const OnigUChar* range, OnigRegion* region, OnigOptionType option)); 783 ONIG_EXTERN 784 int onig_search_with_param P_((OnigRegex, const OnigUChar* str, const OnigUChar* end, const OnigUChar* start, const OnigUChar* range, OnigRegion* region, OnigOptionType option, OnigMatchParam* mp)); 785 ONIG_EXTERN 786 int onig_match P_((OnigRegex, const OnigUChar* str, const OnigUChar* end, const OnigUChar* at, OnigRegion* region, OnigOptionType option)); 787 ONIG_EXTERN 788 int onig_match_with_param P_((OnigRegex, const OnigUChar* str, const OnigUChar* end, const OnigUChar* at, OnigRegion* region, OnigOptionType option, OnigMatchParam* mp)); 789 ONIG_EXTERN 790 OnigRegion* onig_region_new P_((void)); 791 ONIG_EXTERN 792 void onig_region_init P_((OnigRegion* region)); 793 ONIG_EXTERN 794 void onig_region_free P_((OnigRegion* region, int free_self)); 795 ONIG_EXTERN 796 void onig_region_copy P_((OnigRegion* to, OnigRegion* from)); 797 ONIG_EXTERN 798 void onig_region_clear P_((OnigRegion* region)); 799 ONIG_EXTERN 800 int onig_region_resize P_((OnigRegion* region, int n)); 801 ONIG_EXTERN 802 int onig_region_set P_((OnigRegion* region, int at, int beg, int end)); 803 ONIG_EXTERN 804 int onig_name_to_group_numbers P_((OnigRegex reg, const OnigUChar* name, const OnigUChar* name_end, int** nums)); 805 ONIG_EXTERN 806 int onig_name_to_backref_number P_((OnigRegex reg, const OnigUChar* name, const OnigUChar* name_end, OnigRegion *region)); 807 ONIG_EXTERN 808 int onig_foreach_name P_((OnigRegex reg, int (*func)(const OnigUChar*, const OnigUChar*,int,int*,OnigRegex,void*), void* arg)); 809 ONIG_EXTERN 810 int onig_number_of_names P_((OnigRegex reg)); 811 ONIG_EXTERN 812 int onig_number_of_captures P_((OnigRegex reg)); 813 ONIG_EXTERN 814 int onig_number_of_capture_histories P_((OnigRegex reg)); 815 ONIG_EXTERN 816 OnigCaptureTreeNode* onig_get_capture_tree P_((OnigRegion* region)); 817 ONIG_EXTERN 818 int onig_capture_tree_traverse P_((OnigRegion* region, int at, int(*callback_func)(int,int,int,int,int,void*), void* arg)); 819 ONIG_EXTERN 820 int onig_noname_group_capture_is_active P_((OnigRegex reg)); 821 ONIG_EXTERN 822 OnigEncoding onig_get_encoding P_((OnigRegex reg)); 823 ONIG_EXTERN 824 OnigOptionType onig_get_options P_((OnigRegex reg)); 825 ONIG_EXTERN 826 OnigCaseFoldType onig_get_case_fold_flag P_((OnigRegex reg)); 827 ONIG_EXTERN 828 OnigSyntaxType* onig_get_syntax P_((OnigRegex reg)); 829 ONIG_EXTERN 830 int onig_set_default_syntax P_((OnigSyntaxType* syntax)); 831 ONIG_EXTERN 832 void onig_copy_syntax P_((OnigSyntaxType* to, OnigSyntaxType* from)); 833 ONIG_EXTERN 834 unsigned int onig_get_syntax_op P_((OnigSyntaxType* syntax)); 835 ONIG_EXTERN 836 unsigned int onig_get_syntax_op2 P_((OnigSyntaxType* syntax)); 837 ONIG_EXTERN 838 unsigned int onig_get_syntax_behavior P_((OnigSyntaxType* syntax)); 839 ONIG_EXTERN 840 OnigOptionType onig_get_syntax_options P_((OnigSyntaxType* syntax)); 841 ONIG_EXTERN 842 void onig_set_syntax_op P_((OnigSyntaxType* syntax, unsigned int op)); 843 ONIG_EXTERN 844 void onig_set_syntax_op2 P_((OnigSyntaxType* syntax, unsigned int op2)); 845 ONIG_EXTERN 846 void onig_set_syntax_behavior P_((OnigSyntaxType* syntax, unsigned int behavior)); 847 ONIG_EXTERN 848 void onig_set_syntax_options P_((OnigSyntaxType* syntax, OnigOptionType options)); 849 ONIG_EXTERN 850 int onig_set_meta_char P_((OnigSyntaxType* syntax, unsigned int what, OnigCodePoint code)); 851 ONIG_EXTERN 852 void onig_copy_encoding P_((OnigEncoding to, OnigEncoding from)); 853 ONIG_EXTERN 854 OnigCaseFoldType onig_get_default_case_fold_flag P_((void)); 855 ONIG_EXTERN 856 int onig_set_default_case_fold_flag P_((OnigCaseFoldType case_fold_flag)); 857 ONIG_EXTERN 858 unsigned int onig_get_match_stack_limit_size P_((void)); 859 ONIG_EXTERN 860 int onig_set_match_stack_limit_size P_((unsigned int size)); 861 ONIG_EXTERN 862 unsigned long onig_get_retry_limit_in_match P_((void)); 863 ONIG_EXTERN 864 int onig_set_retry_limit_in_match P_((unsigned long n)); 865 ONIG_EXTERN 866 unsigned int onig_get_parse_depth_limit P_((void)); 867 ONIG_EXTERN 868 int onig_set_capture_num_limit P_((int num)); 869 ONIG_EXTERN 870 int onig_set_parse_depth_limit P_((unsigned int depth)); 871 ONIG_EXTERN 872 int onig_unicode_define_user_property P_((const char* name, OnigCodePoint* ranges)); 873 ONIG_EXTERN 874 int onig_end P_((void)); 875 ONIG_EXTERN 876 const char* onig_version P_((void)); 877 ONIG_EXTERN 878 const char* onig_copyright P_((void)); 879 880 /* for OnigMatchParam */ 881 ONIG_EXTERN 882 OnigMatchParam* onig_new_match_param P_((void)); 883 ONIG_EXTERN 884 void onig_free_match_param P_((OnigMatchParam* p)); 885 ONIG_EXTERN 886 void onig_free_match_param_content P_((OnigMatchParam* p)); 887 ONIG_EXTERN 888 int onig_initialize_match_param P_((OnigMatchParam* mp)); 889 ONIG_EXTERN 890 int onig_set_match_stack_limit_size_of_match_param P_((OnigMatchParam* param, unsigned int limit)); 891 ONIG_EXTERN 892 int onig_set_retry_limit_in_match_of_match_param P_((OnigMatchParam* param, unsigned long limit)); 893 ONIG_EXTERN 894 int onig_set_progress_callout_of_match_param P_((OnigMatchParam* param, OnigCalloutFunc f)); 895 ONIG_EXTERN 896 int onig_set_retraction_callout_of_match_param P_((OnigMatchParam* param, OnigCalloutFunc f)); 897 ONIG_EXTERN 898 int onig_set_callout_user_data_of_match_param P_((OnigMatchParam* param, void* user_data)); 899 900 /* for callout functions */ 901 ONIG_EXTERN 902 OnigCalloutFunc onig_get_progress_callout P_((void)); 903 ONIG_EXTERN 904 int onig_set_progress_callout P_((OnigCalloutFunc f)); 905 ONIG_EXTERN 906 OnigCalloutFunc onig_get_retraction_callout P_((void)); 907 ONIG_EXTERN 908 int onig_set_retraction_callout P_((OnigCalloutFunc f)); 909 ONIG_EXTERN 910 int onig_set_callout_of_name P_((OnigEncoding enc, OnigCalloutType type, OnigUChar* name, OnigUChar* name_end, int callout_in, OnigCalloutFunc callout, OnigCalloutFunc end_callout, int arg_num, unsigned int arg_types[], int optional_arg_num, OnigValue opt_defaults[])); 911 ONIG_EXTERN 912 OnigUChar* onig_get_callout_name_by_name_id P_((int id)); 913 ONIG_EXTERN 914 int onig_get_callout_num_by_tag P_((OnigRegex reg, const OnigUChar* tag, const OnigUChar* tag_end)); 915 ONIG_EXTERN 916 int onig_get_callout_data_by_tag P_((OnigRegex reg, OnigMatchParam* mp, const OnigUChar* tag, const OnigUChar* tag_end, int slot, OnigType* type, OnigValue* val)); 917 ONIG_EXTERN 918 int onig_set_callout_data_by_tag P_((OnigRegex reg, OnigMatchParam* mp, const OnigUChar* tag, const OnigUChar* tag_end, int slot, OnigType type, OnigValue* val)); 919 920 /* used in callout functions */ 921 ONIG_EXTERN 922 int onig_get_callout_num_by_callout_args P_((OnigCalloutArgs* args)); 923 ONIG_EXTERN 924 OnigCalloutIn onig_get_callout_in_by_callout_args P_((OnigCalloutArgs* args)); 925 ONIG_EXTERN 926 int onig_get_name_id_by_callout_args P_((OnigCalloutArgs* args)); 927 ONIG_EXTERN 928 const OnigUChar* onig_get_contents_by_callout_args P_((OnigCalloutArgs* args)); 929 ONIG_EXTERN 930 const OnigUChar* onig_get_contents_end_by_callout_args P_((OnigCalloutArgs* args)); 931 ONIG_EXTERN 932 int onig_get_args_num_by_callout_args P_((OnigCalloutArgs* args)); 933 ONIG_EXTERN 934 int onig_get_passed_args_num_by_callout_args P_((OnigCalloutArgs* args)); 935 ONIG_EXTERN 936 int onig_get_arg_by_callout_args P_((OnigCalloutArgs* args, int index, OnigType* type, OnigValue* val)); 937 ONIG_EXTERN 938 const OnigUChar* onig_get_string_by_callout_args P_((OnigCalloutArgs* args)); 939 ONIG_EXTERN 940 const OnigUChar* onig_get_string_end_by_callout_args P_((OnigCalloutArgs* args)); 941 ONIG_EXTERN 942 const OnigUChar* onig_get_start_by_callout_args P_((OnigCalloutArgs* args)); 943 ONIG_EXTERN 944 const OnigUChar* onig_get_right_range_by_callout_args P_((OnigCalloutArgs* args)); 945 ONIG_EXTERN 946 const OnigUChar* onig_get_current_by_callout_args P_((OnigCalloutArgs* args)); 947 ONIG_EXTERN 948 OnigRegex onig_get_regex_by_callout_args P_((OnigCalloutArgs* args)); 949 ONIG_EXTERN 950 unsigned long onig_get_retry_counter_by_callout_args P_((OnigCalloutArgs* args)); 951 ONIG_EXTERN 952 int onig_callout_tag_is_exist_at_callout_num P_((OnigRegex reg, int callout_num)); 953 ONIG_EXTERN 954 const OnigUChar* onig_get_callout_tag_start P_((OnigRegex reg, int callout_num)); 955 ONIG_EXTERN 956 const OnigUChar* onig_get_callout_tag_end P_((OnigRegex reg, int callout_num)); 957 ONIG_EXTERN 958 int onig_get_callout_data_dont_clear_old P_((OnigRegex reg, OnigMatchParam* mp, int callout_num, int slot, OnigType* type, OnigValue* val)); 959 ONIG_EXTERN 960 int onig_get_callout_data_by_callout_args_self_dont_clear_old P_((OnigCalloutArgs* args, int slot, OnigType* type, OnigValue* val)); 961 ONIG_EXTERN 962 int onig_get_callout_data P_((OnigRegex reg, OnigMatchParam* mp, int callout_num, int slot, OnigType* type, OnigValue* val)); 963 ONIG_EXTERN 964 int onig_get_callout_data_by_callout_args P_((OnigCalloutArgs* args, int callout_num, int slot, OnigType* type, OnigValue* val)); 965 ONIG_EXTERN 966 int onig_get_callout_data_by_callout_args_self P_((OnigCalloutArgs* args, int slot, OnigType* type, OnigValue* val)); 967 ONIG_EXTERN 968 int onig_set_callout_data P_((OnigRegex reg, OnigMatchParam* mp, int callout_num, int slot, OnigType type, OnigValue* val)); 969 ONIG_EXTERN 970 int onig_set_callout_data_by_callout_args P_((OnigCalloutArgs* args, int callout_num, int slot, OnigType type, OnigValue* val)); 971 ONIG_EXTERN 972 int onig_set_callout_data_by_callout_args_self P_((OnigCalloutArgs* args, int slot, OnigType type, OnigValue* val)); 973 ONIG_EXTERN 974 int onig_get_capture_range_in_callout P_((OnigCalloutArgs* args, int mem_num, int* begin, int* end)); 975 ONIG_EXTERN 976 int onig_get_used_stack_size_in_callout P_((OnigCalloutArgs* args, int* used_num, int* used_bytes)); 977 978 /* builtin callout functions */ 979 ONIG_EXTERN 980 int onig_builtin_fail P_((OnigCalloutArgs* args, void* user_data)); 981 ONIG_EXTERN 982 int onig_builtin_mismatch P_((OnigCalloutArgs* args, void* user_data)); 983 ONIG_EXTERN 984 int onig_builtin_error P_((OnigCalloutArgs* args, void* user_data)); 985 ONIG_EXTERN 986 int onig_builtin_count P_((OnigCalloutArgs* args, void* user_data)); 987 ONIG_EXTERN 988 int onig_builtin_total_count P_((OnigCalloutArgs* args, void* user_data)); 989 ONIG_EXTERN 990 int onig_builtin_max P_((OnigCalloutArgs* args, void* user_data)); 991 ONIG_EXTERN 992 int onig_builtin_cmp P_((OnigCalloutArgs* args, void* user_data)); 993 994 ONIG_EXTERN 995 int onig_setup_builtin_monitors_by_ascii_encoded_name P_((void* fp)); 996 997 #ifdef __cplusplus 998 } 999 #endif 1000 1001 #endif /* ONIGURUMA_H */ 1002