1 #ifndef ONIGURUMA_H 2 #define ONIGURUMA_H 3 /********************************************************************** 4 oniguruma.h - Oniguruma (regular expression library) 5 **********************************************************************/ 6 /*- 7 * Copyright (c) 2002-2007 K.Kosako <sndgk393 AT ybb DOT ne DOT jp> 8 * All rights reserved. 9 * 10 * Redistribution and use in source and binary forms, with or without 11 * modification, are permitted provided that the following conditions 12 * are met: 13 * 1. Redistributions of source code must retain the above copyright 14 * notice, this list of conditions and the following disclaimer. 15 * 2. Redistributions in binary form must reproduce the above copyright 16 * notice, this list of conditions and the following disclaimer in the 17 * documentation and/or other materials provided with the distribution. 18 * 19 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND 20 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 21 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE 22 * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE 23 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL 24 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS 25 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) 26 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT 27 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY 28 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF 29 * SUCH DAMAGE. 30 */ 31 32 #include "../php_onig_compat.h" 33 34 #ifdef __cplusplus 35 extern "C" { 36 #endif 37 38 #define ONIGURUMA 39 #define ONIGURUMA_VERSION_MAJOR 4 40 #define ONIGURUMA_VERSION_MINOR 7 41 #define ONIGURUMA_VERSION_TEENY 1 42 43 #ifdef __cplusplus 44 # ifndef HAVE_PROTOTYPES 45 # define HAVE_PROTOTYPES 1 46 # endif 47 # ifndef HAVE_STDARG_PROTOTYPES 48 # define HAVE_STDARG_PROTOTYPES 1 49 # endif 50 #endif 51 52 /* escape Mac OS X/Xcode 2.4/gcc 4.0.1 problem */ 53 #if defined(__APPLE__) && defined(__GNUC__) && __GNUC__ >= 4 54 # ifndef HAVE_STDARG_PROTOTYPES 55 # define HAVE_STDARG_PROTOTYPES 1 56 # endif 57 #endif 58 59 #ifndef P_ 60 #if defined(__STDC__) || defined(_WIN32) 61 # define P_(args) args 62 #else 63 # define P_(args) () 64 #endif 65 #endif 66 67 #ifndef PV_ 68 #ifdef HAVE_STDARG_PROTOTYPES 69 # define PV_(args) args 70 #else 71 # define PV_(args) () 72 #endif 73 #endif 74 75 #ifndef ONIG_EXTERN 76 #if defined(_WIN32) && !defined(__GNUC__) 77 #if defined(EXPORT) || defined(RUBY_EXPORT) 78 #define ONIG_EXTERN extern __declspec(dllexport) 79 #else 80 #define ONIG_EXTERN extern __declspec(dllimport) 81 #endif 82 #endif 83 #endif 84 85 #ifndef ONIG_EXTERN 86 #define ONIG_EXTERN extern 87 #endif 88 89 /* PART: character encoding */ 90 91 #ifndef ONIG_ESCAPE_UCHAR_COLLISION 92 #define UChar OnigUChar 93 #endif 94 95 typedef unsigned char OnigUChar; 96 typedef unsigned long OnigCodePoint; 97 typedef unsigned int OnigDistance; 98 99 #define ONIG_INFINITE_DISTANCE ~((OnigDistance )0) 100 101 /* ambiguous match flag */ 102 typedef unsigned int OnigAmbigType; 103 104 ONIG_EXTERN OnigAmbigType OnigDefaultAmbigFlag; 105 106 #define ONIGENC_AMBIGUOUS_MATCH_NONE 0 107 #define ONIGENC_AMBIGUOUS_MATCH_ASCII_CASE (1<<0) 108 #define ONIGENC_AMBIGUOUS_MATCH_NONASCII_CASE (1<<1) 109 110 #define ONIGENC_AMBIGUOUS_MATCH_LIMIT (1<<1) 111 112 #define ONIGENC_AMBIGUOUS_MATCH_FULL \ 113 ( ONIGENC_AMBIGUOUS_MATCH_ASCII_CASE | ONIGENC_AMBIGUOUS_MATCH_NONASCII_CASE ) 114 #define ONIGENC_AMBIGUOUS_MATCH_DEFAULT OnigDefaultAmbigFlag 115 116 117 #define ONIGENC_MAX_COMP_AMBIG_CODE_LEN 3 118 #define ONIGENC_MAX_COMP_AMBIG_CODE_ITEM_NUM 4 119 120 /* code range */ 121 #define ONIGENC_CODE_RANGE_NUM(range) ((int )range[0]) 122 #define ONIGENC_CODE_RANGE_FROM(range,i) range[((i)*2) + 1] 123 #define ONIGENC_CODE_RANGE_TO(range,i) range[((i)*2) + 2] 124 125 typedef struct { 126 int len; 127 OnigCodePoint code[ONIGENC_MAX_COMP_AMBIG_CODE_LEN]; 128 } OnigCompAmbigCodeItem; 129 130 typedef struct { 131 int n; 132 OnigCodePoint code; 133 OnigCompAmbigCodeItem items[ONIGENC_MAX_COMP_AMBIG_CODE_ITEM_NUM]; 134 } OnigCompAmbigCodes; 135 136 typedef struct { 137 OnigCodePoint from; 138 OnigCodePoint to; 139 } OnigPairAmbigCodes; 140 141 typedef struct { 142 OnigCodePoint esc; 143 OnigCodePoint anychar; 144 OnigCodePoint anytime; 145 OnigCodePoint zero_or_one_time; 146 OnigCodePoint one_or_more_time; 147 OnigCodePoint anychar_anytime; 148 } OnigMetaCharTableType; 149 150 151 #if defined(RUBY_PLATFORM) && defined(M17N_H) 152 153 #define ONIG_RUBY_M17N 154 typedef m17n_encoding* OnigEncoding; 155 156 #else 157 158 typedef struct { 159 int (*mbc_enc_len)(const OnigUChar* p); 160 const char* name; 161 int max_enc_len; 162 int min_enc_len; 163 OnigAmbigType support_ambig_flag; 164 OnigMetaCharTableType meta_char_table; 165 int (*is_mbc_newline)(const OnigUChar* p, const OnigUChar* end); 166 OnigCodePoint (*mbc_to_code)(const OnigUChar* p, const OnigUChar* end); 167 int (*code_to_mbclen)(OnigCodePoint code); 168 int (*code_to_mbc)(OnigCodePoint code, OnigUChar *buf); 169 int (*mbc_to_normalize)(OnigAmbigType flag, const OnigUChar** pp, const OnigUChar* end, OnigUChar* to); 170 int (*is_mbc_ambiguous)(OnigAmbigType flag, const OnigUChar** pp, const OnigUChar* end); 171 int (*get_all_pair_ambig_codes)(OnigAmbigType flag, const OnigPairAmbigCodes** acs); 172 int (*get_all_comp_ambig_codes)(OnigAmbigType flag, const OnigCompAmbigCodes** acs); 173 int (*is_code_ctype)(OnigCodePoint code, unsigned int ctype); 174 int (*get_ctype_code_range)(int ctype, const OnigCodePoint* sb_range[], const OnigCodePoint* mb_range[]); 175 OnigUChar* (*left_adjust_char_head)(const OnigUChar* start, const OnigUChar* p); 176 int (*is_allowed_reverse_match)(const OnigUChar* p, const OnigUChar* end); 177 } OnigEncodingType; 178 179 typedef OnigEncodingType* OnigEncoding; 180 181 ONIG_EXTERN OnigEncodingType OnigEncodingASCII; 182 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_1; 183 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_2; 184 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_3; 185 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_4; 186 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_5; 187 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_6; 188 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_7; 189 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_8; 190 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_9; 191 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_10; 192 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_11; 193 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_13; 194 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_14; 195 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_15; 196 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_16; 197 ONIG_EXTERN OnigEncodingType OnigEncodingUTF8; 198 ONIG_EXTERN OnigEncodingType OnigEncodingUTF16_BE; 199 ONIG_EXTERN OnigEncodingType OnigEncodingUTF16_LE; 200 ONIG_EXTERN OnigEncodingType OnigEncodingUTF32_BE; 201 ONIG_EXTERN OnigEncodingType OnigEncodingUTF32_LE; 202 ONIG_EXTERN OnigEncodingType OnigEncodingEUC_JP; 203 ONIG_EXTERN OnigEncodingType OnigEncodingEUC_TW; 204 ONIG_EXTERN OnigEncodingType OnigEncodingEUC_KR; 205 ONIG_EXTERN OnigEncodingType OnigEncodingEUC_CN; 206 ONIG_EXTERN OnigEncodingType OnigEncodingSJIS; 207 ONIG_EXTERN OnigEncodingType OnigEncodingKOI8; 208 ONIG_EXTERN OnigEncodingType OnigEncodingKOI8_R; 209 ONIG_EXTERN OnigEncodingType OnigEncodingBIG5; 210 ONIG_EXTERN OnigEncodingType OnigEncodingGB18030; 211 212 #define ONIG_ENCODING_ASCII (&OnigEncodingASCII) 213 #define ONIG_ENCODING_ISO_8859_1 (&OnigEncodingISO_8859_1) 214 #define ONIG_ENCODING_ISO_8859_2 (&OnigEncodingISO_8859_2) 215 #define ONIG_ENCODING_ISO_8859_3 (&OnigEncodingISO_8859_3) 216 #define ONIG_ENCODING_ISO_8859_4 (&OnigEncodingISO_8859_4) 217 #define ONIG_ENCODING_ISO_8859_5 (&OnigEncodingISO_8859_5) 218 #define ONIG_ENCODING_ISO_8859_6 (&OnigEncodingISO_8859_6) 219 #define ONIG_ENCODING_ISO_8859_7 (&OnigEncodingISO_8859_7) 220 #define ONIG_ENCODING_ISO_8859_8 (&OnigEncodingISO_8859_8) 221 #define ONIG_ENCODING_ISO_8859_9 (&OnigEncodingISO_8859_9) 222 #define ONIG_ENCODING_ISO_8859_10 (&OnigEncodingISO_8859_10) 223 #define ONIG_ENCODING_ISO_8859_11 (&OnigEncodingISO_8859_11) 224 #define ONIG_ENCODING_ISO_8859_13 (&OnigEncodingISO_8859_13) 225 #define ONIG_ENCODING_ISO_8859_14 (&OnigEncodingISO_8859_14) 226 #define ONIG_ENCODING_ISO_8859_15 (&OnigEncodingISO_8859_15) 227 #define ONIG_ENCODING_ISO_8859_16 (&OnigEncodingISO_8859_16) 228 #define ONIG_ENCODING_UTF8 (&OnigEncodingUTF8) 229 #define ONIG_ENCODING_UTF16_BE (&OnigEncodingUTF16_BE) 230 #define ONIG_ENCODING_UTF16_LE (&OnigEncodingUTF16_LE) 231 #define ONIG_ENCODING_UTF32_BE (&OnigEncodingUTF32_BE) 232 #define ONIG_ENCODING_UTF32_LE (&OnigEncodingUTF32_LE) 233 #define ONIG_ENCODING_EUC_JP (&OnigEncodingEUC_JP) 234 #define ONIG_ENCODING_EUC_TW (&OnigEncodingEUC_TW) 235 #define ONIG_ENCODING_EUC_KR (&OnigEncodingEUC_KR) 236 #define ONIG_ENCODING_EUC_CN (&OnigEncodingEUC_CN) 237 #define ONIG_ENCODING_SJIS (&OnigEncodingSJIS) 238 #define ONIG_ENCODING_KOI8 (&OnigEncodingKOI8) 239 #define ONIG_ENCODING_KOI8_R (&OnigEncodingKOI8_R) 240 #define ONIG_ENCODING_BIG5 (&OnigEncodingBIG5) 241 #define ONIG_ENCODING_GB18030 (&OnigEncodingGB18030) 242 243 #endif /* else RUBY && M17N */ 244 245 #define ONIG_ENCODING_UNDEF ((OnigEncoding )0) 246 247 248 /* work size */ 249 #define ONIGENC_CODE_TO_MBC_MAXLEN 7 250 #define ONIGENC_MBC_NORMALIZE_MAXLEN ONIGENC_CODE_TO_MBC_MAXLEN 251 252 /* character types */ 253 #define ONIGENC_CTYPE_NEWLINE (1<< 0) 254 #define ONIGENC_CTYPE_ALPHA (1<< 1) 255 #define ONIGENC_CTYPE_BLANK (1<< 2) 256 #define ONIGENC_CTYPE_CNTRL (1<< 3) 257 #define ONIGENC_CTYPE_DIGIT (1<< 4) 258 #define ONIGENC_CTYPE_GRAPH (1<< 5) 259 #define ONIGENC_CTYPE_LOWER (1<< 6) 260 #define ONIGENC_CTYPE_PRINT (1<< 7) 261 #define ONIGENC_CTYPE_PUNCT (1<< 8) 262 #define ONIGENC_CTYPE_SPACE (1<< 9) 263 #define ONIGENC_CTYPE_UPPER (1<<10) 264 #define ONIGENC_CTYPE_XDIGIT (1<<11) 265 #define ONIGENC_CTYPE_WORD (1<<12) 266 #define ONIGENC_CTYPE_ASCII (1<<13) 267 #define ONIGENC_CTYPE_ALNUM (ONIGENC_CTYPE_ALPHA | ONIGENC_CTYPE_DIGIT) 268 269 #define enc_len(enc,p) ONIGENC_MBC_ENC_LEN(enc, p) 270 271 #define ONIGENC_IS_UNDEF(enc) ((enc) == ONIG_ENCODING_UNDEF) 272 #define ONIGENC_IS_SINGLEBYTE(enc) (ONIGENC_MBC_MAXLEN(enc) == 1) 273 #define ONIGENC_IS_MBC_HEAD(enc,p) (ONIGENC_MBC_ENC_LEN(enc,p) != 1) 274 #define ONIGENC_IS_MBC_ASCII(p) (*(p) < 128) 275 #define ONIGENC_IS_CODE_ASCII(code) ((code) < 128) 276 #define ONIGENC_IS_CODE_SB_WORD(enc,code) \ 277 (ONIGENC_IS_CODE_ASCII(code) && ONIGENC_IS_CODE_WORD(enc,code)) 278 #define ONIGENC_IS_MBC_WORD(enc,s,end) \ 279 ONIGENC_IS_CODE_WORD(enc,ONIGENC_MBC_TO_CODE(enc,s,end)) 280 281 282 #ifdef ONIG_RUBY_M17N 283 284 #include <ctype.h> /* for isblank(), isgraph() */ 285 286 #define ONIGENC_MBC_TO_NORMALIZE(enc,flag,pp,end,buf) \ 287 onigenc_mbc_to_normalize(enc,flag,pp,end,buf) 288 #define ONIGENC_IS_MBC_AMBIGUOUS(enc,flag,pp,end) \ 289 onigenc_is_mbc_ambiguous(enc,flag,pp,end) 290 291 #define ONIGENC_SUPPORT_AMBIG_FLAG(enc) ONIGENC_AMBIGUOUS_MATCH_ASCII_CASE 292 #define ONIGENC_IS_ALLOWED_REVERSE_MATCH(enc,s,end) \ 293 onigenc_is_allowed_reverse_match(enc, s, end) 294 #define ONIGENC_LEFT_ADJUST_CHAR_HEAD(enc,start,s) \ 295 onigenc_get_left_adjust_char_head(enc, start, s) 296 #define ONIGENC_GET_ALL_PAIR_AMBIG_CODES(enc, ambig_flag, acs) 0 297 #define ONIGENC_GET_ALL_COMP_AMBIG_CODES(enc, ambig_flag, acs) 0 298 #define ONIGENC_GET_CTYPE_CODE_RANGE(enc,ctype,sbr,mbr) \ 299 ONIG_NO_SUPPORT_CONFIG 300 #define ONIGENC_MBC_ENC_LEN(enc,p) m17n_mbclen(enc,(int )(*p)) 301 #define ONIGENC_MBC_MAXLEN(enc) m17n_mbmaxlen(enc) 302 #define ONIGENC_MBC_MAXLEN_DIST(enc) \ 303 (ONIGENC_MBC_MAXLEN(enc) > 0 ? ONIGENC_MBC_MAXLEN(enc) \ 304 : ONIG_INFINITE_DISTANCE) 305 #define ONIGENC_MBC_MINLEN(enc) 1 306 #define ONIGENC_MBC_TO_CODE(enc,p,e) m17n_codepoint((enc),(p),(e)) 307 #define ONIGENC_CODE_TO_MBCLEN(enc,code) m17n_codelen((enc),(code)) 308 #define ONIGENC_CODE_TO_MBC(enc,code,buf) onigenc_code_to_mbc(enc, code, buf) 309 310 #if 0 /* !! not supported !! */ 311 #define ONIGENC_IS_MBC_NEWLINE(enc,p,end) 312 #define ONIGENC_STEP_BACK(enc,start,s,n) 313 #endif 314 315 #define ONIGENC_IS_CODE_CTYPE(enc,code,ctype) \ 316 onigenc_is_code_ctype(enc,code,ctype) 317 318 #ifdef isblank 319 # define ONIGENC_IS_CODE_BLANK(enc,code) isblank((int )code) 320 #else 321 # define ONIGENC_IS_CODE_BLANK(enc,code) ((code) == ' ' || (code) == '\t') 322 #endif 323 #ifdef isgraph 324 # define ONIGENC_IS_CODE_GRAPH(enc,code) isgraph((int )code) 325 #else 326 # define ONIGENC_IS_CODE_GRAPH(enc,code) \ 327 (isprint((int )code) && !isspace((int )code)) 328 #endif 329 330 #define ONIGENC_IS_CODE_PRINT(enc,code) m17n_isprint(enc,code) 331 #define ONIGENC_IS_CODE_ALNUM(enc,code) m17n_isalnum(enc,code) 332 #define ONIGENC_IS_CODE_ALPHA(enc,code) m17n_isalpha(enc,code) 333 #define ONIGENC_IS_CODE_LOWER(enc,code) m17n_islower(enc,code) 334 #define ONIGENC_IS_CODE_UPPER(enc,code) m17n_isupper(enc,code) 335 #define ONIGENC_IS_CODE_CNTRL(enc,code) m17n_iscntrl(enc,code) 336 #define ONIGENC_IS_CODE_PUNCT(enc,code) m17n_ispunct(enc,code) 337 #define ONIGENC_IS_CODE_SPACE(enc,code) m17n_isspace(enc,code) 338 #define ONIGENC_IS_CODE_DIGIT(enc,code) m17n_isdigit(enc,code) 339 #define ONIGENC_IS_CODE_XDIGIT(enc,code) m17n_isxdigit(enc,code) 340 #define ONIGENC_IS_CODE_WORD(enc,code) m17n_iswchar(enc,code) 341 342 ONIG_EXTERN 343 int onigenc_is_code_ctype P_((OnigEncoding enc, OnigCodePoint code, int ctype)); 344 ONIG_EXTERN 345 int onigenc_code_to_mbc P_((OnigEncoding enc, OnigCodePoint code, OnigUChar *buf)); 346 ONIG_EXTERN 347 int onigenc_mbc_to_normalize P_((OnigEncoding enc, OnigAmbigType flag, const OnigUChar** pp, const OnigUChar* end, OnigUChar* buf)); 348 ONIG_EXTERN 349 int onigenc_is_mbc_ambiguous P_((OnigEncoding enc, OnigAmbigType flag, const OnigUChar** pp, const OnigUChar* end)); 350 ONIG_EXTERN 351 int onigenc_is_allowed_reverse_match P_((OnigEncoding enc, const OnigUChar* s, const OnigUChar* end)); 352 353 #else /* ONIG_RUBY_M17N */ 354 355 #define ONIGENC_NAME(enc) ((enc)->name) 356 357 #define ONIGENC_MBC_TO_NORMALIZE(enc,flag,pp,end,buf) \ 358 (enc)->mbc_to_normalize(flag,(const OnigUChar** )pp,end,buf) 359 #define ONIGENC_IS_MBC_AMBIGUOUS(enc,flag,pp,end) \ 360 (enc)->is_mbc_ambiguous(flag,(const OnigUChar** )pp,end) 361 #define ONIGENC_SUPPORT_AMBIG_FLAG(enc) ((enc)->support_ambig_flag) 362 #define ONIGENC_IS_ALLOWED_REVERSE_MATCH(enc,s,end) \ 363 (enc)->is_allowed_reverse_match(s,end) 364 #define ONIGENC_LEFT_ADJUST_CHAR_HEAD(enc,start,s) \ 365 (enc)->left_adjust_char_head(start, s) 366 #define ONIGENC_GET_ALL_PAIR_AMBIG_CODES(enc,ambig_flag,acs) \ 367 (enc)->get_all_pair_ambig_codes(ambig_flag,acs) 368 #define ONIGENC_GET_ALL_COMP_AMBIG_CODES(enc,ambig_flag,acs) \ 369 (enc)->get_all_comp_ambig_codes(ambig_flag,acs) 370 #define ONIGENC_STEP_BACK(enc,start,s,n) \ 371 onigenc_step_back((enc),(start),(s),(n)) 372 373 #define ONIGENC_MBC_ENC_LEN(enc,p) (enc)->mbc_enc_len(p) 374 #define ONIGENC_MBC_MAXLEN(enc) ((enc)->max_enc_len) 375 #define ONIGENC_MBC_MAXLEN_DIST(enc) ONIGENC_MBC_MAXLEN(enc) 376 #define ONIGENC_MBC_MINLEN(enc) ((enc)->min_enc_len) 377 #define ONIGENC_IS_MBC_NEWLINE(enc,p,end) (enc)->is_mbc_newline((p),(end)) 378 #define ONIGENC_MBC_TO_CODE(enc,p,end) (enc)->mbc_to_code((p),(end)) 379 #define ONIGENC_CODE_TO_MBCLEN(enc,code) (enc)->code_to_mbclen(code) 380 #define ONIGENC_CODE_TO_MBC(enc,code,buf) (enc)->code_to_mbc(code,buf) 381 382 #define ONIGENC_IS_CODE_CTYPE(enc,code,ctype) (enc)->is_code_ctype(code,ctype) 383 384 #define ONIGENC_IS_CODE_NEWLINE(enc,code) \ 385 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_NEWLINE) 386 #define ONIGENC_IS_CODE_GRAPH(enc,code) \ 387 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_GRAPH) 388 #define ONIGENC_IS_CODE_PRINT(enc,code) \ 389 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_PRINT) 390 #define ONIGENC_IS_CODE_ALNUM(enc,code) \ 391 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_ALNUM) 392 #define ONIGENC_IS_CODE_ALPHA(enc,code) \ 393 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_ALPHA) 394 #define ONIGENC_IS_CODE_LOWER(enc,code) \ 395 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_LOWER) 396 #define ONIGENC_IS_CODE_UPPER(enc,code) \ 397 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_UPPER) 398 #define ONIGENC_IS_CODE_CNTRL(enc,code) \ 399 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_CNTRL) 400 #define ONIGENC_IS_CODE_PUNCT(enc,code) \ 401 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_PUNCT) 402 #define ONIGENC_IS_CODE_SPACE(enc,code) \ 403 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_SPACE) 404 #define ONIGENC_IS_CODE_BLANK(enc,code) \ 405 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_BLANK) 406 #define ONIGENC_IS_CODE_DIGIT(enc,code) \ 407 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_DIGIT) 408 #define ONIGENC_IS_CODE_XDIGIT(enc,code) \ 409 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_XDIGIT) 410 #define ONIGENC_IS_CODE_WORD(enc,code) \ 411 ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_WORD) 412 413 #define ONIGENC_GET_CTYPE_CODE_RANGE(enc,ctype,sbr,mbr) \ 414 (enc)->get_ctype_code_range(ctype,sbr,mbr) 415 416 ONIG_EXTERN 417 OnigUChar* onigenc_step_back P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s, int n)); 418 419 #endif /* is not ONIG_RUBY_M17N */ 420 421 422 /* encoding API */ 423 ONIG_EXTERN 424 int onigenc_init P_((void)); 425 ONIG_EXTERN 426 int onigenc_set_default_encoding P_((OnigEncoding enc)); 427 ONIG_EXTERN 428 OnigEncoding onigenc_get_default_encoding P_((void)); 429 ONIG_EXTERN 430 void onigenc_set_default_caseconv_table P_((const OnigUChar* table)); 431 ONIG_EXTERN 432 OnigUChar* onigenc_get_right_adjust_char_head_with_prev P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s, const OnigUChar** prev)); 433 ONIG_EXTERN 434 OnigUChar* onigenc_get_prev_char_head P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s)); 435 ONIG_EXTERN 436 OnigUChar* onigenc_get_left_adjust_char_head P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s)); 437 ONIG_EXTERN 438 OnigUChar* onigenc_get_right_adjust_char_head P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s)); 439 ONIG_EXTERN 440 int onigenc_strlen P_((OnigEncoding enc, const OnigUChar* p, const OnigUChar* end)); 441 ONIG_EXTERN 442 int onigenc_strlen_null P_((OnigEncoding enc, const OnigUChar* p)); 443 ONIG_EXTERN 444 int onigenc_str_bytelen_null P_((OnigEncoding enc, const OnigUChar* p)); 445 446 447 448 /* PART: regular expression */ 449 450 /* config parameters */ 451 #define ONIG_NREGION 10 452 #define ONIG_MAX_BACKREF_NUM 1000 453 #define ONIG_MAX_REPEAT_NUM 100000 454 #define ONIG_MAX_MULTI_BYTE_RANGES_NUM 10000 455 /* constants */ 456 #define ONIG_MAX_ERROR_MESSAGE_LEN 90 457 458 typedef unsigned int OnigOptionType; 459 460 #define ONIG_OPTION_DEFAULT ONIG_OPTION_NONE 461 462 /* options */ 463 #define ONIG_OPTION_NONE 0U 464 #define ONIG_OPTION_IGNORECASE 1U 465 #define ONIG_OPTION_EXTEND (ONIG_OPTION_IGNORECASE << 1) 466 #define ONIG_OPTION_MULTILINE (ONIG_OPTION_EXTEND << 1) 467 #define ONIG_OPTION_SINGLELINE (ONIG_OPTION_MULTILINE << 1) 468 #define ONIG_OPTION_FIND_LONGEST (ONIG_OPTION_SINGLELINE << 1) 469 #define ONIG_OPTION_FIND_NOT_EMPTY (ONIG_OPTION_FIND_LONGEST << 1) 470 #define ONIG_OPTION_NEGATE_SINGLELINE (ONIG_OPTION_FIND_NOT_EMPTY << 1) 471 #define ONIG_OPTION_DONT_CAPTURE_GROUP (ONIG_OPTION_NEGATE_SINGLELINE << 1) 472 #define ONIG_OPTION_CAPTURE_GROUP (ONIG_OPTION_DONT_CAPTURE_GROUP << 1) 473 /* options (search time) */ 474 #define ONIG_OPTION_NOTBOL (ONIG_OPTION_CAPTURE_GROUP << 1) 475 #define ONIG_OPTION_NOTEOL (ONIG_OPTION_NOTBOL << 1) 476 #define ONIG_OPTION_POSIX_REGION (ONIG_OPTION_NOTEOL << 1) 477 #define ONIG_OPTION_MAXBIT ONIG_OPTION_POSIX_REGION /* limit */ 478 479 #define ONIG_OPTION_ON(options,regopt) ((options) |= (regopt)) 480 #define ONIG_OPTION_OFF(options,regopt) ((options) &= ~(regopt)) 481 #define ONIG_IS_OPTION_ON(options,option) ((options) & (option)) 482 483 /* syntax */ 484 typedef struct { 485 unsigned int op; 486 unsigned int op2; 487 unsigned int behavior; 488 OnigOptionType options; /* default option */ 489 } OnigSyntaxType; 490 491 ONIG_EXTERN OnigSyntaxType OnigSyntaxASIS; 492 ONIG_EXTERN OnigSyntaxType OnigSyntaxPosixBasic; 493 ONIG_EXTERN OnigSyntaxType OnigSyntaxPosixExtended; 494 ONIG_EXTERN OnigSyntaxType OnigSyntaxEmacs; 495 ONIG_EXTERN OnigSyntaxType OnigSyntaxGrep; 496 ONIG_EXTERN OnigSyntaxType OnigSyntaxGnuRegex; 497 ONIG_EXTERN OnigSyntaxType OnigSyntaxJava; 498 ONIG_EXTERN OnigSyntaxType OnigSyntaxPerl; 499 ONIG_EXTERN OnigSyntaxType OnigSyntaxPerl_NG; 500 ONIG_EXTERN OnigSyntaxType OnigSyntaxRuby; 501 502 /* predefined syntaxes (see regsyntax.c) */ 503 #define ONIG_SYNTAX_ASIS (&OnigSyntaxASIS) 504 #define ONIG_SYNTAX_POSIX_BASIC (&OnigSyntaxPosixBasic) 505 #define ONIG_SYNTAX_POSIX_EXTENDED (&OnigSyntaxPosixExtended) 506 #define ONIG_SYNTAX_EMACS (&OnigSyntaxEmacs) 507 #define ONIG_SYNTAX_GREP (&OnigSyntaxGrep) 508 #define ONIG_SYNTAX_GNU_REGEX (&OnigSyntaxGnuRegex) 509 #define ONIG_SYNTAX_JAVA (&OnigSyntaxJava) 510 #define ONIG_SYNTAX_PERL (&OnigSyntaxPerl) 511 #define ONIG_SYNTAX_PERL_NG (&OnigSyntaxPerl_NG) 512 #define ONIG_SYNTAX_RUBY (&OnigSyntaxRuby) 513 514 /* default syntax */ 515 ONIG_EXTERN OnigSyntaxType* OnigDefaultSyntax; 516 #define ONIG_SYNTAX_DEFAULT OnigDefaultSyntax 517 518 /* syntax (operators) */ 519 #define ONIG_SYN_OP_VARIABLE_META_CHARACTERS (1U<<0) 520 #define ONIG_SYN_OP_DOT_ANYCHAR (1U<<1) /* . */ 521 #define ONIG_SYN_OP_ASTERISK_ZERO_INF (1U<<2) /* * */ 522 #define ONIG_SYN_OP_ESC_ASTERISK_ZERO_INF (1U<<3) 523 #define ONIG_SYN_OP_PLUS_ONE_INF (1U<<4) /* + */ 524 #define ONIG_SYN_OP_ESC_PLUS_ONE_INF (1U<<5) 525 #define ONIG_SYN_OP_QMARK_ZERO_ONE (1U<<6) /* ? */ 526 #define ONIG_SYN_OP_ESC_QMARK_ZERO_ONE (1U<<7) 527 #define ONIG_SYN_OP_BRACE_INTERVAL (1U<<8) /* {lower,upper} */ 528 #define ONIG_SYN_OP_ESC_BRACE_INTERVAL (1U<<9) /* \{lower,upper\} */ 529 #define ONIG_SYN_OP_VBAR_ALT (1U<<10) /* | */ 530 #define ONIG_SYN_OP_ESC_VBAR_ALT (1U<<11) /* \| */ 531 #define ONIG_SYN_OP_LPAREN_SUBEXP (1U<<12) /* (...) */ 532 #define ONIG_SYN_OP_ESC_LPAREN_SUBEXP (1U<<13) /* \(...\) */ 533 #define ONIG_SYN_OP_ESC_AZ_BUF_ANCHOR (1U<<14) /* \A, \Z, \z */ 534 #define ONIG_SYN_OP_ESC_CAPITAL_G_BEGIN_ANCHOR (1U<<15) /* \G */ 535 #define ONIG_SYN_OP_DECIMAL_BACKREF (1U<<16) /* \num */ 536 #define ONIG_SYN_OP_BRACKET_CC (1U<<17) /* [...] */ 537 #define ONIG_SYN_OP_ESC_W_WORD (1U<<18) /* \w, \W */ 538 #define ONIG_SYN_OP_ESC_LTGT_WORD_BEGIN_END (1U<<19) /* \<. \> */ 539 #define ONIG_SYN_OP_ESC_B_WORD_BOUND (1U<<20) /* \b, \B */ 540 #define ONIG_SYN_OP_ESC_S_WHITE_SPACE (1U<<21) /* \s, \S */ 541 #define ONIG_SYN_OP_ESC_D_DIGIT (1U<<22) /* \d, \D */ 542 #define ONIG_SYN_OP_LINE_ANCHOR (1U<<23) /* ^, $ */ 543 #define ONIG_SYN_OP_POSIX_BRACKET (1U<<24) /* [:xxxx:] */ 544 #define ONIG_SYN_OP_QMARK_NON_GREEDY (1U<<25) /* ??,*?,+?,{n,m}? */ 545 #define ONIG_SYN_OP_ESC_CONTROL_CHARS (1U<<26) /* \n,\r,\t,\a ... */ 546 #define ONIG_SYN_OP_ESC_C_CONTROL (1U<<27) /* \cx */ 547 #define ONIG_SYN_OP_ESC_OCTAL3 (1U<<28) /* \OOO */ 548 #define ONIG_SYN_OP_ESC_X_HEX2 (1U<<29) /* \xHH */ 549 #define ONIG_SYN_OP_ESC_X_BRACE_HEX8 (1U<<30) /* \x{7HHHHHHH} */ 550 551 #define ONIG_SYN_OP2_ESC_CAPITAL_Q_QUOTE (1U<<0) /* \Q...\E */ 552 #define ONIG_SYN_OP2_QMARK_GROUP_EFFECT (1U<<1) /* (?...) */ 553 #define ONIG_SYN_OP2_OPTION_PERL (1U<<2) /* (?imsx),(?-imsx) */ 554 #define ONIG_SYN_OP2_OPTION_RUBY (1U<<3) /* (?imx), (?-imx) */ 555 #define ONIG_SYN_OP2_PLUS_POSSESSIVE_REPEAT (1U<<4) /* ?+,*+,++ */ 556 #define ONIG_SYN_OP2_PLUS_POSSESSIVE_INTERVAL (1U<<5) /* {n,m}+ */ 557 #define ONIG_SYN_OP2_CCLASS_SET_OP (1U<<6) /* [...&&..[..]..] */ 558 #define ONIG_SYN_OP2_QMARK_LT_NAMED_GROUP (1U<<7) /* (?<name>...) */ 559 #define ONIG_SYN_OP2_ESC_K_NAMED_BACKREF (1U<<8) /* \k<name> */ 560 #define ONIG_SYN_OP2_ESC_G_SUBEXP_CALL (1U<<9) /* \g<name>, \g<n> */ 561 #define ONIG_SYN_OP2_ATMARK_CAPTURE_HISTORY (1U<<10) /* (?@..),(?@<x>..) */ 562 #define ONIG_SYN_OP2_ESC_CAPITAL_C_BAR_CONTROL (1U<<11) /* \C-x */ 563 #define ONIG_SYN_OP2_ESC_CAPITAL_M_BAR_META (1U<<12) /* \M-x */ 564 #define ONIG_SYN_OP2_ESC_V_VTAB (1U<<13) /* \v as VTAB */ 565 #define ONIG_SYN_OP2_ESC_U_HEX4 (1U<<14) /* \uHHHH */ 566 #define ONIG_SYN_OP2_ESC_GNU_BUF_ANCHOR (1U<<15) /* \`, \' */ 567 #define ONIG_SYN_OP2_ESC_P_BRACE_CHAR_PROPERTY (1U<<16) /* \p{...}, \P{...} */ 568 #define ONIG_SYN_OP2_ESC_P_BRACE_CIRCUMFLEX_NOT (1U<<17) /* \p{^..}, \P{^..} */ 569 #define ONIG_SYN_OP2_CHAR_PROPERTY_PREFIX_IS (1U<<18) /* \p{IsXDigit} */ 570 #define ONIG_SYN_OP2_ESC_H_XDIGIT (1U<<19) /* \h, \H */ 571 #define ONIG_SYN_OP2_INEFFECTIVE_ESCAPE (1U<<20) /* \ */ 572 573 /* syntax (behavior) */ 574 #define ONIG_SYN_CONTEXT_INDEP_ANCHORS (1U<<31) /* not implemented */ 575 #define ONIG_SYN_CONTEXT_INDEP_REPEAT_OPS (1U<<0) /* ?, *, +, {n,m} */ 576 #define ONIG_SYN_CONTEXT_INVALID_REPEAT_OPS (1U<<1) /* error or ignore */ 577 #define ONIG_SYN_ALLOW_UNMATCHED_CLOSE_SUBEXP (1U<<2) /* ...)... */ 578 #define ONIG_SYN_ALLOW_INVALID_INTERVAL (1U<<3) /* {??? */ 579 #define ONIG_SYN_ALLOW_INTERVAL_LOW_ABBREV (1U<<4) /* {,n} => {0,n} */ 580 #define ONIG_SYN_STRICT_CHECK_BACKREF (1U<<5) /* /(\1)/,/\1()/ ..*/ 581 #define ONIG_SYN_DIFFERENT_LEN_ALT_LOOK_BEHIND (1U<<6) /* (?<=a|bc) */ 582 #define ONIG_SYN_CAPTURE_ONLY_NAMED_GROUP (1U<<7) /* see doc/RE */ 583 #define ONIG_SYN_ALLOW_MULTIPLEX_DEFINITION_NAME (1U<<8) /* (?<x>)(?<x>) */ 584 #define ONIG_SYN_FIXED_INTERVAL_IS_GREEDY_ONLY (1U<<9) /* a{n}?=(?:a{n})? */ 585 586 /* syntax (behavior) in char class [...] */ 587 #define ONIG_SYN_NOT_NEWLINE_IN_NEGATIVE_CC (1U<<20) /* [^...] */ 588 #define ONIG_SYN_BACKSLASH_ESCAPE_IN_CC (1U<<21) /* [..\w..] etc.. */ 589 #define ONIG_SYN_ALLOW_EMPTY_RANGE_IN_CC (1U<<22) 590 #define ONIG_SYN_ALLOW_DOUBLE_RANGE_OP_IN_CC (1U<<23) /* [0-9-a]=[0-9\-a] */ 591 /* syntax (behavior) warning */ 592 #define ONIG_SYN_WARN_CC_OP_NOT_ESCAPED (1U<<24) /* [,-,] */ 593 #define ONIG_SYN_WARN_REDUNDANT_NESTED_REPEAT (1U<<25) /* (?:a*)+ */ 594 595 /* meta character specifiers (onig_set_meta_char()) */ 596 #define ONIG_META_CHAR_ESCAPE 0 597 #define ONIG_META_CHAR_ANYCHAR 1 598 #define ONIG_META_CHAR_ANYTIME 2 599 #define ONIG_META_CHAR_ZERO_OR_ONE_TIME 3 600 #define ONIG_META_CHAR_ONE_OR_MORE_TIME 4 601 #define ONIG_META_CHAR_ANYCHAR_ANYTIME 5 602 603 #define ONIG_INEFFECTIVE_META_CHAR 0 604 605 /* error codes */ 606 #define ONIG_IS_PATTERN_ERROR(ecode) ((ecode) <= -100 && (ecode) > -1000) 607 /* normal return */ 608 #define ONIG_NORMAL 0 609 #define ONIG_MISMATCH -1 610 #define ONIG_NO_SUPPORT_CONFIG -2 611 612 /* internal error */ 613 #define ONIGERR_MEMORY -5 614 #define ONIGERR_TYPE_BUG -6 615 #define ONIGERR_PARSER_BUG -11 616 #define ONIGERR_STACK_BUG -12 617 #define ONIGERR_UNDEFINED_BYTECODE -13 618 #define ONIGERR_UNEXPECTED_BYTECODE -14 619 #define ONIGERR_MATCH_STACK_LIMIT_OVER -15 620 #define ONIGERR_DEFAULT_ENCODING_IS_NOT_SETTED -21 621 #define ONIGERR_SPECIFIED_ENCODING_CANT_CONVERT_TO_WIDE_CHAR -22 622 /* general error */ 623 #define ONIGERR_INVALID_ARGUMENT -30 624 /* syntax error */ 625 #define ONIGERR_END_PATTERN_AT_LEFT_BRACE -100 626 #define ONIGERR_END_PATTERN_AT_LEFT_BRACKET -101 627 #define ONIGERR_EMPTY_CHAR_CLASS -102 628 #define ONIGERR_PREMATURE_END_OF_CHAR_CLASS -103 629 #define ONIGERR_END_PATTERN_AT_ESCAPE -104 630 #define ONIGERR_END_PATTERN_AT_META -105 631 #define ONIGERR_END_PATTERN_AT_CONTROL -106 632 #define ONIGERR_META_CODE_SYNTAX -108 633 #define ONIGERR_CONTROL_CODE_SYNTAX -109 634 #define ONIGERR_CHAR_CLASS_VALUE_AT_END_OF_RANGE -110 635 #define ONIGERR_CHAR_CLASS_VALUE_AT_START_OF_RANGE -111 636 #define ONIGERR_UNMATCHED_RANGE_SPECIFIER_IN_CHAR_CLASS -112 637 #define ONIGERR_TARGET_OF_REPEAT_OPERATOR_NOT_SPECIFIED -113 638 #define ONIGERR_TARGET_OF_REPEAT_OPERATOR_INVALID -114 639 #define ONIGERR_NESTED_REPEAT_OPERATOR -115 640 #define ONIGERR_UNMATCHED_CLOSE_PARENTHESIS -116 641 #define ONIGERR_END_PATTERN_WITH_UNMATCHED_PARENTHESIS -117 642 #define ONIGERR_END_PATTERN_IN_GROUP -118 643 #define ONIGERR_UNDEFINED_GROUP_OPTION -119 644 #define ONIGERR_INVALID_POSIX_BRACKET_TYPE -121 645 #define ONIGERR_INVALID_LOOK_BEHIND_PATTERN -122 646 #define ONIGERR_INVALID_REPEAT_RANGE_PATTERN -123 647 /* values error (syntax error) */ 648 #define ONIGERR_TOO_BIG_NUMBER -200 649 #define ONIGERR_TOO_BIG_NUMBER_FOR_REPEAT_RANGE -201 650 #define ONIGERR_UPPER_SMALLER_THAN_LOWER_IN_REPEAT_RANGE -202 651 #define ONIGERR_EMPTY_RANGE_IN_CHAR_CLASS -203 652 #define ONIGERR_MISMATCH_CODE_LENGTH_IN_CLASS_RANGE -204 653 #define ONIGERR_TOO_MANY_MULTI_BYTE_RANGES -205 654 #define ONIGERR_TOO_SHORT_MULTI_BYTE_STRING -206 655 #define ONIGERR_TOO_BIG_BACKREF_NUMBER -207 656 #define ONIGERR_INVALID_BACKREF -208 657 #define ONIGERR_NUMBERED_BACKREF_OR_CALL_NOT_ALLOWED -209 658 #define ONIGERR_TOO_LONG_WIDE_CHAR_VALUE -212 659 #define ONIGERR_EMPTY_GROUP_NAME -214 660 #define ONIGERR_INVALID_GROUP_NAME -215 661 #define ONIGERR_INVALID_CHAR_IN_GROUP_NAME -216 662 #define ONIGERR_UNDEFINED_NAME_REFERENCE -217 663 #define ONIGERR_UNDEFINED_GROUP_REFERENCE -218 664 #define ONIGERR_MULTIPLEX_DEFINED_NAME -219 665 #define ONIGERR_MULTIPLEX_DEFINITION_NAME_CALL -220 666 #define ONIGERR_NEVER_ENDING_RECURSION -221 667 #define ONIGERR_GROUP_NUMBER_OVER_FOR_CAPTURE_HISTORY -222 668 #define ONIGERR_INVALID_CHAR_PROPERTY_NAME -223 669 #define ONIGERR_INVALID_WIDE_CHAR_VALUE -400 670 #define ONIGERR_TOO_BIG_WIDE_CHAR_VALUE -401 671 #define ONIGERR_NOT_SUPPORTED_ENCODING_COMBINATION -402 672 #define ONIGERR_INVALID_COMBINATION_OF_OPTIONS -403 673 674 /* errors related to thread */ 675 #define ONIGERR_OVER_THREAD_PASS_LIMIT_COUNT -1001 676 677 678 /* must be smaller than BIT_STATUS_BITS_NUM (unsigned int * 8) */ 679 #define ONIG_MAX_CAPTURE_HISTORY_GROUP 31 680 #define ONIG_IS_CAPTURE_HISTORY_GROUP(r, i) \ 681 ((i) <= ONIG_MAX_CAPTURE_HISTORY_GROUP && (r)->list && (r)->list[i]) 682 683 typedef struct OnigCaptureTreeNodeStruct { 684 int group; /* group number */ 685 int beg; 686 int end; 687 int allocated; 688 int num_childs; 689 struct OnigCaptureTreeNodeStruct** childs; 690 } OnigCaptureTreeNode; 691 692 /* match result region type */ 693 struct re_registers { 694 int allocated; 695 int num_regs; 696 int* beg; 697 int* end; 698 /* extended */ 699 OnigCaptureTreeNode* history_root; /* capture history tree root */ 700 }; 701 702 /* capture tree traverse */ 703 #define ONIG_TRAVERSE_CALLBACK_AT_FIRST 1 704 #define ONIG_TRAVERSE_CALLBACK_AT_LAST 2 705 #define ONIG_TRAVERSE_CALLBACK_AT_BOTH \ 706 ( ONIG_TRAVERSE_CALLBACK_AT_FIRST | ONIG_TRAVERSE_CALLBACK_AT_LAST ) 707 708 709 #define ONIG_REGION_NOTPOS -1 710 711 typedef struct re_registers OnigRegion; 712 713 typedef struct { 714 OnigEncoding enc; 715 OnigUChar* par; 716 OnigUChar* par_end; 717 } OnigErrorInfo; 718 719 typedef struct { 720 int lower; 721 int upper; 722 } OnigRepeatRange; 723 724 typedef void (*OnigWarnFunc) P_((const char* s)); 725 extern void onig_null_warn P_((const char* s)); 726 #define ONIG_NULL_WARN onig_null_warn 727 728 #define ONIG_CHAR_TABLE_SIZE 256 729 730 /* regex_t state */ 731 #define ONIG_STATE_NORMAL 0 732 #define ONIG_STATE_SEARCHING 1 733 #define ONIG_STATE_COMPILING -1 734 #define ONIG_STATE_MODIFY -2 735 736 #define ONIG_STATE(reg) \ 737 ((reg)->state > 0 ? ONIG_STATE_SEARCHING : (reg)->state) 738 739 typedef struct re_pattern_buffer { 740 /* common members of BBuf(bytes-buffer) */ 741 unsigned char* p; /* compiled pattern */ 742 unsigned int used; /* used space for p */ 743 unsigned int alloc; /* allocated space for p */ 744 745 int state; /* normal, searching, compiling */ 746 int num_mem; /* used memory(...) num counted from 1 */ 747 int num_repeat; /* OP_REPEAT/OP_REPEAT_NG id-counter */ 748 int num_null_check; /* OP_NULL_CHECK_START/END id counter */ 749 int num_comb_exp_check; /* combination explosion check */ 750 int num_call; /* number of subexp call */ 751 unsigned int capture_history; /* (?@...) flag (1-31) */ 752 unsigned int bt_mem_start; /* need backtrack flag */ 753 unsigned int bt_mem_end; /* need backtrack flag */ 754 int stack_pop_level; 755 int repeat_range_alloc; 756 OnigRepeatRange* repeat_range; 757 758 OnigEncoding enc; 759 OnigOptionType options; 760 OnigSyntaxType* syntax; 761 OnigAmbigType ambig_flag; 762 void* name_table; 763 764 /* optimization info (string search, char-map and anchors) */ 765 int optimize; /* optimize flag */ 766 int threshold_len; /* search str-length for apply optimize */ 767 int anchor; /* BEGIN_BUF, BEGIN_POS, (SEMI_)END_BUF */ 768 OnigDistance anchor_dmin; /* (SEMI_)END_BUF anchor distance */ 769 OnigDistance anchor_dmax; /* (SEMI_)END_BUF anchor distance */ 770 int sub_anchor; /* start-anchor for exact or map */ 771 unsigned char *exact; 772 unsigned char *exact_end; 773 unsigned char map[ONIG_CHAR_TABLE_SIZE]; /* used as BM skip or char-map */ 774 int *int_map; /* BM skip for exact_len > 255 */ 775 int *int_map_backward; /* BM skip for backward search */ 776 OnigDistance dmin; /* min-distance of exact or map */ 777 OnigDistance dmax; /* max-distance of exact or map */ 778 779 /* regex_t link chain */ 780 struct re_pattern_buffer* chain; /* escape compile-conflict */ 781 } OnigRegexType; 782 783 typedef OnigRegexType* OnigRegex; 784 785 #ifndef ONIG_ESCAPE_REGEX_T_COLLISION 786 typedef OnigRegexType regex_t; 787 #endif 788 789 790 typedef struct { 791 int num_of_elements; 792 OnigEncoding pattern_enc; 793 OnigEncoding target_enc; 794 OnigSyntaxType* syntax; 795 OnigOptionType option; 796 OnigAmbigType ambig_flag; 797 } OnigCompileInfo; 798 799 /* Oniguruma Native API */ 800 ONIG_EXTERN 801 int onig_init P_((void)); 802 ONIG_EXTERN 803 int onig_error_code_to_str PV_((OnigUChar* s, int err_code, ...)); 804 ONIG_EXTERN 805 void onig_set_warn_func P_((OnigWarnFunc f)); 806 ONIG_EXTERN 807 void onig_set_verb_warn_func P_((OnigWarnFunc f)); 808 ONIG_EXTERN 809 int onig_new P_((OnigRegex*, const OnigUChar* pattern, const OnigUChar* pattern_end, OnigOptionType option, OnigEncoding enc, OnigSyntaxType* syntax, OnigErrorInfo* einfo)); 810 ONIG_EXTERN 811 int onig_new_deluxe P_((OnigRegex* reg, const OnigUChar* pattern, const OnigUChar* pattern_end, OnigCompileInfo* ci, OnigErrorInfo* einfo)); 812 ONIG_EXTERN 813 void onig_free P_((OnigRegex)); 814 ONIG_EXTERN 815 int onig_recompile P_((OnigRegex, const OnigUChar* pattern, const OnigUChar* pattern_end, OnigOptionType option, OnigEncoding enc, OnigSyntaxType* syntax, OnigErrorInfo* einfo)); 816 ONIG_EXTERN 817 int onig_recompile_deluxe P_((OnigRegex reg, const OnigUChar* pattern, const OnigUChar* pattern_end, OnigCompileInfo* ci, OnigErrorInfo* einfo)); 818 ONIG_EXTERN 819 int onig_search P_((OnigRegex, const OnigUChar* str, const OnigUChar* end, const OnigUChar* start, const OnigUChar* range, OnigRegion* region, OnigOptionType option)); 820 ONIG_EXTERN 821 int onig_match P_((OnigRegex, const OnigUChar* str, const OnigUChar* end, const OnigUChar* at, OnigRegion* region, OnigOptionType option)); 822 ONIG_EXTERN 823 OnigRegion* onig_region_new P_((void)); 824 ONIG_EXTERN 825 void onig_region_init P_((OnigRegion* region)); 826 ONIG_EXTERN 827 void onig_region_free P_((OnigRegion* region, int free_self)); 828 ONIG_EXTERN 829 void onig_region_copy P_((OnigRegion* to, OnigRegion* from)); 830 ONIG_EXTERN 831 void onig_region_clear P_((OnigRegion* region)); 832 ONIG_EXTERN 833 int onig_region_resize P_((OnigRegion* region, int n)); 834 ONIG_EXTERN 835 int onig_region_set P_((OnigRegion* region, int at, int beg, int end)); 836 ONIG_EXTERN 837 int onig_name_to_group_numbers P_((OnigRegex reg, const OnigUChar* name, const OnigUChar* name_end, int** nums)); 838 ONIG_EXTERN 839 int onig_name_to_backref_number P_((OnigRegex reg, const OnigUChar* name, const OnigUChar* name_end, OnigRegion *region)); 840 ONIG_EXTERN 841 int onig_foreach_name P_((OnigRegex reg, int (*func)(const OnigUChar*, const OnigUChar*,int,int*,OnigRegex,void*), void* arg)); 842 ONIG_EXTERN 843 int onig_number_of_names P_((OnigRegex reg)); 844 ONIG_EXTERN 845 int onig_number_of_captures P_((OnigRegex reg)); 846 ONIG_EXTERN 847 int onig_number_of_capture_histories P_((OnigRegex reg)); 848 ONIG_EXTERN 849 OnigCaptureTreeNode* onig_get_capture_tree P_((OnigRegion* region)); 850 ONIG_EXTERN 851 int onig_capture_tree_traverse P_((OnigRegion* region, int at, int(*callback_func)(int,int,int,int,int,void*), void* arg)); 852 ONIG_EXTERN 853 int onig_noname_group_capture_is_active P_((OnigRegex reg)); 854 ONIG_EXTERN 855 OnigEncoding onig_get_encoding P_((OnigRegex reg)); 856 ONIG_EXTERN 857 OnigOptionType onig_get_options P_((OnigRegex reg)); 858 ONIG_EXTERN 859 OnigAmbigType onig_get_ambig_flag P_((OnigRegex reg)); 860 ONIG_EXTERN 861 OnigSyntaxType* onig_get_syntax P_((OnigRegex reg)); 862 ONIG_EXTERN 863 int onig_set_default_syntax P_((OnigSyntaxType* syntax)); 864 ONIG_EXTERN 865 void onig_copy_syntax P_((OnigSyntaxType* to, OnigSyntaxType* from)); 866 ONIG_EXTERN 867 unsigned int onig_get_syntax_op P_((OnigSyntaxType* syntax)); 868 ONIG_EXTERN 869 unsigned int onig_get_syntax_op2 P_((OnigSyntaxType* syntax)); 870 ONIG_EXTERN 871 unsigned int onig_get_syntax_behavior P_((OnigSyntaxType* syntax)); 872 ONIG_EXTERN 873 OnigOptionType onig_get_syntax_options P_((OnigSyntaxType* syntax)); 874 ONIG_EXTERN 875 void onig_set_syntax_op P_((OnigSyntaxType* syntax, unsigned int op)); 876 ONIG_EXTERN 877 void onig_set_syntax_op2 P_((OnigSyntaxType* syntax, unsigned int op2)); 878 ONIG_EXTERN 879 void onig_set_syntax_behavior P_((OnigSyntaxType* syntax, unsigned int behavior)); 880 ONIG_EXTERN 881 void onig_set_syntax_options P_((OnigSyntaxType* syntax, OnigOptionType options)); 882 ONIG_EXTERN 883 int onig_set_meta_char P_((OnigEncoding enc, unsigned int what, OnigCodePoint code)); 884 ONIG_EXTERN 885 void onig_copy_encoding P_((OnigEncoding to, OnigEncoding from)); 886 ONIG_EXTERN 887 OnigAmbigType onig_get_default_ambig_flag P_((void)); 888 ONIG_EXTERN 889 int onig_set_default_ambig_flag P_((OnigAmbigType ambig_flag)); 890 ONIG_EXTERN 891 unsigned int onig_get_match_stack_limit_size P_((void)); 892 ONIG_EXTERN 893 int onig_set_match_stack_limit_size P_((unsigned int size)); 894 ONIG_EXTERN 895 int onig_end P_((void)); 896 ONIG_EXTERN 897 const char* onig_version P_((void)); 898 ONIG_EXTERN 899 const char* onig_copyright P_((void)); 900 901 #ifdef __cplusplus 902 } 903 #endif 904 905 #endif /* ONIGURUMA_H */ 906