1 #ifndef ONIGURUMA_H
2 #define ONIGURUMA_H
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32 #ifdef __cplusplus
33 extern "C" {
34 #endif
35
/* Library marker plus the three-part version number (5.9.6). */
#define ONIGURUMA
#define ONIGURUMA_VERSION_MAJOR   5
#define ONIGURUMA_VERSION_MINOR   9
#define ONIGURUMA_VERSION_TEENY   6
40
/*
 * Prototype-support detection.
 *
 * P_(args)  wraps the parameter list of an ordinary function declaration.
 * PV_(args) wraps the parameter list of a variadic function declaration.
 * Each expands to its argument when prototypes are available and to an
 * empty "()" otherwise.  Both can be pre-defined by the includer.
 */

/* A C++ compiler always understands both kinds of prototype. */
#ifdef __cplusplus
# ifndef HAVE_PROTOTYPES
#  define HAVE_PROTOTYPES 1
# endif
# ifndef HAVE_STDARG_PROTOTYPES
#  define HAVE_STDARG_PROTOTYPES 1
# endif
#endif

/* Variadic prototypes: Apple GCC >= 4, or any platform with <stdarg.h>. */
#if (defined(__APPLE__) && defined(__GNUC__) && __GNUC__ >= 4) || \
    defined(HAVE_STDARG_H)
# ifndef HAVE_STDARG_PROTOTYPES
#  define HAVE_STDARG_PROTOTYPES 1
# endif
#endif

#ifndef P_
/*
 * HAVE_PROTOTYPES is honored here as well: it is set above for C++ (and may
 * be set by a configure step), and a C++ translation unit is not guaranteed
 * to define __STDC__.  An empty "()" in C++ would declare a function taking
 * no arguments and break every call.
 */
# if defined(__STDC__) || defined(_WIN32) || defined(HAVE_PROTOTYPES)
#  define P_(args) args
# else
#  define P_(args) ()
# endif
#endif

#ifndef PV_
# ifdef HAVE_STDARG_PROTOTYPES
#  define PV_(args) args
# else
#  define PV_(args) ()
# endif
#endif
78
/*
 * ONIG_EXTERN: storage/linkage prefix for every public declaration.
 * With a non-GCC Windows compiler it carries __declspec(dllexport) when
 * EXPORT or RUBY_EXPORT is defined and __declspec(dllimport) otherwise;
 * everywhere else it is plain "extern".  May be pre-defined by the includer.
 */
#ifndef ONIG_EXTERN
# if defined(_WIN32) && !defined(__GNUC__)
#  if defined(EXPORT) || defined(RUBY_EXPORT)
#   define ONIG_EXTERN   extern __declspec(dllexport)
#  else
#   define ONIG_EXTERN   extern __declspec(dllimport)
#  endif
# else
#  define ONIG_EXTERN   extern
# endif
#endif
92
93
94
/*
 * Short alias UChar for OnigUChar.  Define ONIG_ESCAPE_UCHAR_COLLISION
 * before including this header to suppress it.
 */
#ifndef ONIG_ESCAPE_UCHAR_COLLISION
# define UChar OnigUChar
#endif

/* Fundamental scalar types. */
#ifdef _WIN32
# include <windows.h>
typedef ULONG_PTR      OnigCodePoint;   /* pointer-sized unsigned on Windows */
#else
typedef unsigned long  OnigCodePoint;
#endif
typedef unsigned char  OnigUChar;
typedef unsigned int   OnigCtype;
typedef unsigned int   OnigDistance;

/* All-ones OnigDistance value; fully parenthesized so it composes safely. */
#define ONIG_INFINITE_DISTANCE  (~((OnigDistance )0))
110
111 typedef unsigned int OnigCaseFoldType;
112
113 ONIG_EXTERN OnigCaseFoldType OnigDefaultCaseFoldFlag;
114
115
116
/* Case-fold flag bits (values for OnigCaseFoldType). */
#define ONIGENC_CASE_FOLD_TURKISH_AZERI         (1<<20)
#define INTERNAL_ONIGENC_CASE_FOLD_MULTI_CHAR   (1<<30)

#define ONIGENC_CASE_FOLD_MIN       INTERNAL_ONIGENC_CASE_FOLD_MULTI_CHAR
#define ONIGENC_CASE_FOLD_DEFAULT   OnigDefaultCaseFoldFlag

/* ONIGENC_MAX_COMP_CASE_FOLD_CODE_LEN sizes OnigCaseFoldCodeItem.code[]. */
#define ONIGENC_MAX_COMP_CASE_FOLD_CODE_LEN     3
#define ONIGENC_GET_CASE_FOLD_CODES_MAX_NUM    13
126
127
128
/*
 * Accessors for a code-range table laid out as
 *   range[0]      = number of (from, to) pairs
 *   range[2*i+1]  = "from" of pair i
 *   range[2*i+2]  = "to"   of pair i
 * The range argument is parenthesized so that pointer expressions such as
 * "table + 1" index correctly.
 */
#define ONIGENC_CODE_RANGE_NUM(range)      ((int )(range)[0])
#define ONIGENC_CODE_RANGE_FROM(range,i)   ((range)[((i)*2) + 1])
#define ONIGENC_CODE_RANGE_TO(range,i)     ((range)[((i)*2) + 2])
132
133 typedef struct {
134 int byte_len;
135 int code_len;
136 OnigCodePoint code[ONIGENC_MAX_COMP_CASE_FOLD_CODE_LEN];
137 } OnigCaseFoldCodeItem;
138
139 typedef struct {
140 OnigCodePoint esc;
141 OnigCodePoint anychar;
142 OnigCodePoint anytime;
143 OnigCodePoint zero_or_one_time;
144 OnigCodePoint one_or_more_time;
145 OnigCodePoint anychar_anytime;
146 } OnigMetaCharTableType;
147
148 typedef int (*OnigApplyAllCaseFoldFunc)(OnigCodePoint from, OnigCodePoint* to, int to_len, void* arg);
149
150 typedef struct OnigEncodingTypeST {
151 int (*mbc_enc_len)(const OnigUChar* p);
152 const char* name;
153 int max_enc_len;
154 int min_enc_len;
155 int (*is_mbc_newline)(const OnigUChar* p, const OnigUChar* end);
156 OnigCodePoint (*mbc_to_code)(const OnigUChar* p, const OnigUChar* end);
157 int (*code_to_mbclen)(OnigCodePoint code);
158 int (*code_to_mbc)(OnigCodePoint code, OnigUChar *buf);
159 int (*mbc_case_fold)(OnigCaseFoldType flag, const OnigUChar** pp, const OnigUChar* end, OnigUChar* to);
160 int (*apply_all_case_fold)(OnigCaseFoldType flag, OnigApplyAllCaseFoldFunc f, void* arg);
161 int (*get_case_fold_codes_by_str)(OnigCaseFoldType flag, const OnigUChar* p, const OnigUChar* end, OnigCaseFoldCodeItem acs[]);
162 int (*property_name_to_ctype)(struct OnigEncodingTypeST* enc, OnigUChar* p, OnigUChar* end);
163 int (*is_code_ctype)(OnigCodePoint code, OnigCtype ctype);
164 int (*get_ctype_code_range)(OnigCtype ctype, OnigCodePoint* sb_out, const OnigCodePoint* ranges[]);
165 OnigUChar* (*left_adjust_char_head)(const OnigUChar* start, const OnigUChar* p);
166 int (*is_allowed_reverse_match)(const OnigUChar* p, const OnigUChar* end);
167 } OnigEncodingType;
168
169 typedef OnigEncodingType* OnigEncoding;
170
171 ONIG_EXTERN OnigEncodingType OnigEncodingASCII;
172 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_1;
173 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_2;
174 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_3;
175 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_4;
176 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_5;
177 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_6;
178 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_7;
179 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_8;
180 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_9;
181 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_10;
182 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_11;
183 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_13;
184 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_14;
185 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_15;
186 ONIG_EXTERN OnigEncodingType OnigEncodingISO_8859_16;
187 ONIG_EXTERN OnigEncodingType OnigEncodingUTF8;
188 ONIG_EXTERN OnigEncodingType OnigEncodingUTF16_BE;
189 ONIG_EXTERN OnigEncodingType OnigEncodingUTF16_LE;
190 ONIG_EXTERN OnigEncodingType OnigEncodingUTF32_BE;
191 ONIG_EXTERN OnigEncodingType OnigEncodingUTF32_LE;
192 ONIG_EXTERN OnigEncodingType OnigEncodingEUC_JP;
193 ONIG_EXTERN OnigEncodingType OnigEncodingEUC_TW;
194 ONIG_EXTERN OnigEncodingType OnigEncodingEUC_KR;
195 ONIG_EXTERN OnigEncodingType OnigEncodingEUC_CN;
196 ONIG_EXTERN OnigEncodingType OnigEncodingSJIS;
197 ONIG_EXTERN OnigEncodingType OnigEncodingKOI8;
198 ONIG_EXTERN OnigEncodingType OnigEncodingKOI8_R;
199 ONIG_EXTERN OnigEncodingType OnigEncodingCP1251;
200 ONIG_EXTERN OnigEncodingType OnigEncodingBIG5;
201 ONIG_EXTERN OnigEncodingType OnigEncodingGB18030;
202
203 #define ONIG_ENCODING_ASCII (&OnigEncodingASCII)
204 #define ONIG_ENCODING_ISO_8859_1 (&OnigEncodingISO_8859_1)
205 #define ONIG_ENCODING_ISO_8859_2 (&OnigEncodingISO_8859_2)
206 #define ONIG_ENCODING_ISO_8859_3 (&OnigEncodingISO_8859_3)
207 #define ONIG_ENCODING_ISO_8859_4 (&OnigEncodingISO_8859_4)
208 #define ONIG_ENCODING_ISO_8859_5 (&OnigEncodingISO_8859_5)
209 #define ONIG_ENCODING_ISO_8859_6 (&OnigEncodingISO_8859_6)
210 #define ONIG_ENCODING_ISO_8859_7 (&OnigEncodingISO_8859_7)
211 #define ONIG_ENCODING_ISO_8859_8 (&OnigEncodingISO_8859_8)
212 #define ONIG_ENCODING_ISO_8859_9 (&OnigEncodingISO_8859_9)
213 #define ONIG_ENCODING_ISO_8859_10 (&OnigEncodingISO_8859_10)
214 #define ONIG_ENCODING_ISO_8859_11 (&OnigEncodingISO_8859_11)
215 #define ONIG_ENCODING_ISO_8859_13 (&OnigEncodingISO_8859_13)
216 #define ONIG_ENCODING_ISO_8859_14 (&OnigEncodingISO_8859_14)
217 #define ONIG_ENCODING_ISO_8859_15 (&OnigEncodingISO_8859_15)
218 #define ONIG_ENCODING_ISO_8859_16 (&OnigEncodingISO_8859_16)
219 #define ONIG_ENCODING_UTF8 (&OnigEncodingUTF8)
220 #define ONIG_ENCODING_UTF16_BE (&OnigEncodingUTF16_BE)
221 #define ONIG_ENCODING_UTF16_LE (&OnigEncodingUTF16_LE)
222 #define ONIG_ENCODING_UTF32_BE (&OnigEncodingUTF32_BE)
223 #define ONIG_ENCODING_UTF32_LE (&OnigEncodingUTF32_LE)
224 #define ONIG_ENCODING_EUC_JP (&OnigEncodingEUC_JP)
225 #define ONIG_ENCODING_EUC_TW (&OnigEncodingEUC_TW)
226 #define ONIG_ENCODING_EUC_KR (&OnigEncodingEUC_KR)
227 #define ONIG_ENCODING_EUC_CN (&OnigEncodingEUC_CN)
228 #define ONIG_ENCODING_SJIS (&OnigEncodingSJIS)
229 #define ONIG_ENCODING_KOI8 (&OnigEncodingKOI8)
230 #define ONIG_ENCODING_KOI8_R (&OnigEncodingKOI8_R)
231 #define ONIG_ENCODING_CP1251 (&OnigEncodingCP1251)
232 #define ONIG_ENCODING_BIG5 (&OnigEncodingBIG5)
233 #define ONIG_ENCODING_GB18030 (&OnigEncodingGB18030)
234
235 #define ONIG_ENCODING_UNDEF ((OnigEncoding )0)
236
237
238
/*
 * NOTE(review): presumably upper bounds for the output of code_to_mbc and
 * mbc_case_fold -- confirm against the encoding implementations.
 */
#define ONIGENC_CODE_TO_MBC_MAXLEN       7
#define ONIGENC_MBC_CASE_FOLD_MAXLEN    18

/* Standard character-type ids (OnigCtype values), numbered 0..14. */
#define ONIGENC_CTYPE_NEWLINE    0
#define ONIGENC_CTYPE_ALPHA      1
#define ONIGENC_CTYPE_BLANK      2
#define ONIGENC_CTYPE_CNTRL      3
#define ONIGENC_CTYPE_DIGIT      4
#define ONIGENC_CTYPE_GRAPH      5
#define ONIGENC_CTYPE_LOWER      6
#define ONIGENC_CTYPE_PRINT      7
#define ONIGENC_CTYPE_PUNCT      8
#define ONIGENC_CTYPE_SPACE      9
#define ONIGENC_CTYPE_UPPER     10
#define ONIGENC_CTYPE_XDIGIT    11
#define ONIGENC_CTYPE_WORD      12
#define ONIGENC_CTYPE_ALNUM     13
#define ONIGENC_CTYPE_ASCII     14
/* Highest id in the list above. */
#define ONIGENC_MAX_STD_CTYPE   ONIGENC_CTYPE_ASCII
260
261
/*
 * Convenience macros that dispatch through an OnigEncoding descriptor.
 * Macro arguments are parenthesized wherever they are used inside a larger
 * expression (notably the cast in ONIGENC_MBC_CASE_FOLD) so that compound
 * argument expressions expand as intended.
 */

/* The "end" argument is accepted but not used by the expansion. */
#define onig_enc_len(enc,p,end)        ONIGENC_MBC_ENC_LEN(enc,p)

#define ONIGENC_IS_UNDEF(enc)          ((enc) == ONIG_ENCODING_UNDEF)
#define ONIGENC_IS_SINGLEBYTE(enc)     (ONIGENC_MBC_MAXLEN(enc) == 1)
#define ONIGENC_IS_MBC_HEAD(enc,p)     (ONIGENC_MBC_ENC_LEN(enc,p) != 1)
#define ONIGENC_IS_MBC_ASCII(p)        (*(p) < 128)
#define ONIGENC_IS_CODE_ASCII(code)    ((code) < 128)
#define ONIGENC_IS_MBC_WORD(enc,s,end) \
  ONIGENC_IS_CODE_WORD(enc,ONIGENC_MBC_TO_CODE(enc,s,end))


#define ONIGENC_NAME(enc)              ((enc)->name)

/* pp is parenthesized before the cast so that the cast covers all of it. */
#define ONIGENC_MBC_CASE_FOLD(enc,flag,pp,end,buf) \
  (enc)->mbc_case_fold((flag),(const OnigUChar** )(pp),(end),(buf))
#define ONIGENC_IS_ALLOWED_REVERSE_MATCH(enc,s,end) \
  (enc)->is_allowed_reverse_match((s),(end))
#define ONIGENC_LEFT_ADJUST_CHAR_HEAD(enc,start,s) \
  (enc)->left_adjust_char_head((start),(s))
#define ONIGENC_APPLY_ALL_CASE_FOLD(enc,case_fold_flag,f,arg) \
  (enc)->apply_all_case_fold((case_fold_flag),(f),(arg))
#define ONIGENC_GET_CASE_FOLD_CODES_BY_STR(enc,case_fold_flag,p,end,acs) \
  (enc)->get_case_fold_codes_by_str((case_fold_flag),(p),(end),(acs))
#define ONIGENC_STEP_BACK(enc,start,s,n) \
  onigenc_step_back((enc),(start),(s),(n))

#define ONIGENC_MBC_ENC_LEN(enc,p)             (enc)->mbc_enc_len((p))
#define ONIGENC_MBC_MAXLEN(enc)                ((enc)->max_enc_len)
#define ONIGENC_MBC_MAXLEN_DIST(enc)           ONIGENC_MBC_MAXLEN(enc)
#define ONIGENC_MBC_MINLEN(enc)                ((enc)->min_enc_len)
#define ONIGENC_IS_MBC_NEWLINE(enc,p,end)      (enc)->is_mbc_newline((p),(end))
#define ONIGENC_MBC_TO_CODE(enc,p,end)         (enc)->mbc_to_code((p),(end))
#define ONIGENC_CODE_TO_MBCLEN(enc,code)       (enc)->code_to_mbclen((code))
#define ONIGENC_CODE_TO_MBC(enc,code,buf)      (enc)->code_to_mbc((code),(buf))
/* enc is evaluated twice: once for dispatch and once as the first argument. */
#define ONIGENC_PROPERTY_NAME_TO_CTYPE(enc,p,end) \
  (enc)->property_name_to_ctype((enc),(p),(end))

#define ONIGENC_IS_CODE_CTYPE(enc,code,ctype)  (enc)->is_code_ctype((code),(ctype))

/* One predicate per standard ctype, all forwarding to ONIGENC_IS_CODE_CTYPE. */
#define ONIGENC_IS_CODE_NEWLINE(enc,code) \
        ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_NEWLINE)
#define ONIGENC_IS_CODE_GRAPH(enc,code) \
        ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_GRAPH)
#define ONIGENC_IS_CODE_PRINT(enc,code) \
        ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_PRINT)
#define ONIGENC_IS_CODE_ALNUM(enc,code) \
        ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_ALNUM)
#define ONIGENC_IS_CODE_ALPHA(enc,code) \
        ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_ALPHA)
#define ONIGENC_IS_CODE_LOWER(enc,code) \
        ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_LOWER)
#define ONIGENC_IS_CODE_UPPER(enc,code) \
        ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_UPPER)
#define ONIGENC_IS_CODE_CNTRL(enc,code) \
        ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_CNTRL)
#define ONIGENC_IS_CODE_PUNCT(enc,code) \
        ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_PUNCT)
#define ONIGENC_IS_CODE_SPACE(enc,code) \
        ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_SPACE)
#define ONIGENC_IS_CODE_BLANK(enc,code) \
        ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_BLANK)
#define ONIGENC_IS_CODE_DIGIT(enc,code) \
        ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_DIGIT)
#define ONIGENC_IS_CODE_XDIGIT(enc,code) \
        ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_XDIGIT)
#define ONIGENC_IS_CODE_WORD(enc,code) \
        ONIGENC_IS_CODE_CTYPE(enc,code,ONIGENC_CTYPE_WORD)

#define ONIGENC_GET_CTYPE_CODE_RANGE(enc,ctype,sbout,ranges) \
  (enc)->get_ctype_code_range((ctype),(sbout),(ranges))
332
333 ONIG_EXTERN
334 OnigUChar* onigenc_step_back P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s, int n));
335
336
337
338 ONIG_EXTERN
339 int onigenc_init P_((void));
340 ONIG_EXTERN
341 int onigenc_set_default_encoding P_((OnigEncoding enc));
342 ONIG_EXTERN
343 OnigEncoding onigenc_get_default_encoding P_((void));
344 ONIG_EXTERN
345 void onigenc_set_default_caseconv_table P_((const OnigUChar* table));
346 ONIG_EXTERN
347 OnigUChar* onigenc_get_right_adjust_char_head_with_prev P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s, const OnigUChar** prev));
348 ONIG_EXTERN
349 OnigUChar* onigenc_get_prev_char_head P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s));
350 ONIG_EXTERN
351 OnigUChar* onigenc_get_left_adjust_char_head P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s));
352 ONIG_EXTERN
353 OnigUChar* onigenc_get_right_adjust_char_head P_((OnigEncoding enc, const OnigUChar* start, const OnigUChar* s));
354 ONIG_EXTERN
355 int onigenc_strlen P_((OnigEncoding enc, const OnigUChar* p, const OnigUChar* end));
356 ONIG_EXTERN
357 int onigenc_strlen_null P_((OnigEncoding enc, const OnigUChar* p));
358 ONIG_EXTERN
359 int onigenc_str_bytelen_null P_((OnigEncoding enc, const OnigUChar* p));
360
361
362
363
364
365
/* Library-wide numeric limits. */
#define ONIG_NREGION                          10
#define ONIG_MAX_BACKREF_NUM                1000
#define ONIG_MAX_REPEAT_NUM               100000
#define ONIG_MAX_MULTI_BYTE_RANGES_NUM     10000

#define ONIG_MAX_ERROR_MESSAGE_LEN            90
372
/* Option word: a set of ONIG_OPTION_* bits. */
typedef unsigned int OnigOptionType;

/* Each option occupies one bit; positions are spelled out explicitly. */
#define ONIG_OPTION_NONE                 0U
#define ONIG_OPTION_IGNORECASE           1U
#define ONIG_OPTION_EXTEND               (1U << 1)
#define ONIG_OPTION_MULTILINE            (1U << 2)
#define ONIG_OPTION_SINGLELINE           (1U << 3)
#define ONIG_OPTION_FIND_LONGEST         (1U << 4)
#define ONIG_OPTION_FIND_NOT_EMPTY       (1U << 5)
#define ONIG_OPTION_NEGATE_SINGLELINE    (1U << 6)
#define ONIG_OPTION_DONT_CAPTURE_GROUP   (1U << 7)
#define ONIG_OPTION_CAPTURE_GROUP        (1U << 8)

#define ONIG_OPTION_NOTBOL               (1U << 9)
#define ONIG_OPTION_NOTEOL               (1U << 10)
#define ONIG_OPTION_POSIX_REGION         (1U << 11)
/* Highest option bit in use. */
#define ONIG_OPTION_MAXBIT               ONIG_OPTION_POSIX_REGION

#define ONIG_OPTION_DEFAULT              ONIG_OPTION_NONE

/* Set, clear and test bits; ON and OFF modify "options" in place. */
#define ONIG_OPTION_ON(options,regopt)      ((options) |= (regopt))
#define ONIG_OPTION_OFF(options,regopt)     ((options) &= ~(regopt))
#define ONIG_IS_OPTION_ON(options,option)   ((options) & (option))
397
398
399 typedef struct {
400 unsigned int op;
401 unsigned int op2;
402 unsigned int behavior;
403 OnigOptionType options;
404 OnigMetaCharTableType meta_char_table;
405 } OnigSyntaxType;
406
407 ONIG_EXTERN OnigSyntaxType OnigSyntaxASIS;
408 ONIG_EXTERN OnigSyntaxType OnigSyntaxPosixBasic;
409 ONIG_EXTERN OnigSyntaxType OnigSyntaxPosixExtended;
410 ONIG_EXTERN OnigSyntaxType OnigSyntaxEmacs;
411 ONIG_EXTERN OnigSyntaxType OnigSyntaxGrep;
412 ONIG_EXTERN OnigSyntaxType OnigSyntaxGnuRegex;
413 ONIG_EXTERN OnigSyntaxType OnigSyntaxJava;
414 ONIG_EXTERN OnigSyntaxType OnigSyntaxPerl;
415 ONIG_EXTERN OnigSyntaxType OnigSyntaxPerl_NG;
416 ONIG_EXTERN OnigSyntaxType OnigSyntaxRuby;
417
418
419 #define ONIG_SYNTAX_ASIS (&OnigSyntaxASIS)
420 #define ONIG_SYNTAX_POSIX_BASIC (&OnigSyntaxPosixBasic)
421 #define ONIG_SYNTAX_POSIX_EXTENDED (&OnigSyntaxPosixExtended)
422 #define ONIG_SYNTAX_EMACS (&OnigSyntaxEmacs)
423 #define ONIG_SYNTAX_GREP (&OnigSyntaxGrep)
424 #define ONIG_SYNTAX_GNU_REGEX (&OnigSyntaxGnuRegex)
425 #define ONIG_SYNTAX_JAVA (&OnigSyntaxJava)
426 #define ONIG_SYNTAX_PERL (&OnigSyntaxPerl)
427 #define ONIG_SYNTAX_PERL_NG (&OnigSyntaxPerl_NG)
428 #define ONIG_SYNTAX_RUBY (&OnigSyntaxRuby)
429
430
431 ONIG_EXTERN OnigSyntaxType* OnigDefaultSyntax;
432 #define ONIG_SYNTAX_DEFAULT OnigDefaultSyntax
433
434
/*
 * ONIG_SYN_OP_* flag bits, one bit each, positions 0..30.
 * NOTE(review): presumably the values stored in OnigSyntaxType.op -- confirm.
 */
#define ONIG_SYN_OP_VARIABLE_META_CHARACTERS      (1U<<0)
#define ONIG_SYN_OP_DOT_ANYCHAR                   (1U<<1)
#define ONIG_SYN_OP_ASTERISK_ZERO_INF             (1U<<2)
#define ONIG_SYN_OP_ESC_ASTERISK_ZERO_INF         (1U<<3)
#define ONIG_SYN_OP_PLUS_ONE_INF                  (1U<<4)
#define ONIG_SYN_OP_ESC_PLUS_ONE_INF              (1U<<5)
#define ONIG_SYN_OP_QMARK_ZERO_ONE                (1U<<6)
#define ONIG_SYN_OP_ESC_QMARK_ZERO_ONE            (1U<<7)
#define ONIG_SYN_OP_BRACE_INTERVAL                (1U<<8)
#define ONIG_SYN_OP_ESC_BRACE_INTERVAL            (1U<<9)
#define ONIG_SYN_OP_VBAR_ALT                      (1U<<10)
#define ONIG_SYN_OP_ESC_VBAR_ALT                  (1U<<11)
#define ONIG_SYN_OP_LPAREN_SUBEXP                 (1U<<12)
#define ONIG_SYN_OP_ESC_LPAREN_SUBEXP             (1U<<13)
#define ONIG_SYN_OP_ESC_AZ_BUF_ANCHOR             (1U<<14)
#define ONIG_SYN_OP_ESC_CAPITAL_G_BEGIN_ANCHOR    (1U<<15)
#define ONIG_SYN_OP_DECIMAL_BACKREF               (1U<<16)
#define ONIG_SYN_OP_BRACKET_CC                    (1U<<17)
#define ONIG_SYN_OP_ESC_W_WORD                    (1U<<18)
#define ONIG_SYN_OP_ESC_LTGT_WORD_BEGIN_END       (1U<<19)
#define ONIG_SYN_OP_ESC_B_WORD_BOUND              (1U<<20)
#define ONIG_SYN_OP_ESC_S_WHITE_SPACE             (1U<<21)
#define ONIG_SYN_OP_ESC_D_DIGIT                   (1U<<22)
#define ONIG_SYN_OP_LINE_ANCHOR                   (1U<<23)
#define ONIG_SYN_OP_POSIX_BRACKET                 (1U<<24)
#define ONIG_SYN_OP_QMARK_NON_GREEDY              (1U<<25)
#define ONIG_SYN_OP_ESC_CONTROL_CHARS             (1U<<26)
#define ONIG_SYN_OP_ESC_C_CONTROL                 (1U<<27)
#define ONIG_SYN_OP_ESC_OCTAL3                    (1U<<28)
#define ONIG_SYN_OP_ESC_X_HEX2                    (1U<<29)
#define ONIG_SYN_OP_ESC_X_BRACE_HEX8              (1U<<30)
466
/*
 * ONIG_SYN_OP2_* flag bits.  Positions 0..17, 19 and 20 are assigned;
 * bit 18 has no name in this list.
 * NOTE(review): presumably the values stored in OnigSyntaxType.op2 -- confirm.
 */
#define ONIG_SYN_OP2_ESC_CAPITAL_Q_QUOTE          (1U<<0)
#define ONIG_SYN_OP2_QMARK_GROUP_EFFECT           (1U<<1)
#define ONIG_SYN_OP2_OPTION_PERL                  (1U<<2)
#define ONIG_SYN_OP2_OPTION_RUBY                  (1U<<3)
#define ONIG_SYN_OP2_PLUS_POSSESSIVE_REPEAT       (1U<<4)
#define ONIG_SYN_OP2_PLUS_POSSESSIVE_INTERVAL     (1U<<5)
#define ONIG_SYN_OP2_CCLASS_SET_OP                (1U<<6)
#define ONIG_SYN_OP2_QMARK_LT_NAMED_GROUP         (1U<<7)
#define ONIG_SYN_OP2_ESC_K_NAMED_BACKREF          (1U<<8)
#define ONIG_SYN_OP2_ESC_G_SUBEXP_CALL            (1U<<9)
#define ONIG_SYN_OP2_ATMARK_CAPTURE_HISTORY       (1U<<10)
#define ONIG_SYN_OP2_ESC_CAPITAL_C_BAR_CONTROL    (1U<<11)
#define ONIG_SYN_OP2_ESC_CAPITAL_M_BAR_META       (1U<<12)
#define ONIG_SYN_OP2_ESC_V_VTAB                   (1U<<13)
#define ONIG_SYN_OP2_ESC_U_HEX4                   (1U<<14)
#define ONIG_SYN_OP2_ESC_GNU_BUF_ANCHOR           (1U<<15)
#define ONIG_SYN_OP2_ESC_P_BRACE_CHAR_PROPERTY    (1U<<16)
#define ONIG_SYN_OP2_ESC_P_BRACE_CIRCUMFLEX_NOT   (1U<<17)

#define ONIG_SYN_OP2_ESC_H_XDIGIT                 (1U<<19)
#define ONIG_SYN_OP2_INEFFECTIVE_ESCAPE           (1U<<20)
488
489
/*
 * ONIG_SYN_* flag bits without an OP/OP2 prefix.
 * NOTE(review): presumably the values stored in OnigSyntaxType.behavior --
 * confirm.
 */
#define ONIG_SYN_CONTEXT_INDEP_ANCHORS             (1U<<31)
#define ONIG_SYN_CONTEXT_INDEP_REPEAT_OPS          (1U<<0)
#define ONIG_SYN_CONTEXT_INVALID_REPEAT_OPS        (1U<<1)
#define ONIG_SYN_ALLOW_UNMATCHED_CLOSE_SUBEXP      (1U<<2)
#define ONIG_SYN_ALLOW_INVALID_INTERVAL            (1U<<3)
#define ONIG_SYN_ALLOW_INTERVAL_LOW_ABBREV         (1U<<4)
#define ONIG_SYN_STRICT_CHECK_BACKREF              (1U<<5)
#define ONIG_SYN_DIFFERENT_LEN_ALT_LOOK_BEHIND     (1U<<6)
#define ONIG_SYN_CAPTURE_ONLY_NAMED_GROUP          (1U<<7)
#define ONIG_SYN_ALLOW_MULTIPLEX_DEFINITION_NAME   (1U<<8)
#define ONIG_SYN_FIXED_INTERVAL_IS_GREEDY_ONLY     (1U<<9)

/* Bits 20..23: names ending in _IN_CC. */
#define ONIG_SYN_NOT_NEWLINE_IN_NEGATIVE_CC        (1U<<20)
#define ONIG_SYN_BACKSLASH_ESCAPE_IN_CC            (1U<<21)
#define ONIG_SYN_ALLOW_EMPTY_RANGE_IN_CC           (1U<<22)
#define ONIG_SYN_ALLOW_DOUBLE_RANGE_OP_IN_CC       (1U<<23)

/* Bits 24..25: names starting with WARN_. */
#define ONIG_SYN_WARN_CC_OP_NOT_ESCAPED            (1U<<24)
#define ONIG_SYN_WARN_REDUNDANT_NESTED_REPEAT      (1U<<25)
510
511
/* Meta-character selectors, numbered 0..5. */
#define ONIG_META_CHAR_ESCAPE             0
#define ONIG_META_CHAR_ANYCHAR            1
#define ONIG_META_CHAR_ANYTIME            2
#define ONIG_META_CHAR_ZERO_OR_ONE_TIME   3
#define ONIG_META_CHAR_ONE_OR_MORE_TIME   4
#define ONIG_META_CHAR_ANYCHAR_ANYTIME    5

#define ONIG_INEFFECTIVE_META_CHAR        0
520
521
/* True when ecode lies in the range -999 .. -100 (inclusive). */
#define ONIG_IS_PATTERN_ERROR(ecode)   ((ecode) <= -100 && (ecode) > -1000)

/* Non-error status values. */
#define ONIG_NORMAL                                             0
#define ONIG_MISMATCH                                          -1
#define ONIG_NO_SUPPORT_CONFIG                                 -2

/* Error codes above -100, i.e. outside the ONIG_IS_PATTERN_ERROR range. */
#define ONIGERR_MEMORY                                         -5
#define ONIGERR_TYPE_BUG                                       -6
#define ONIGERR_PARSER_BUG                                    -11
#define ONIGERR_STACK_BUG                                     -12
#define ONIGERR_UNDEFINED_BYTECODE                            -13
#define ONIGERR_UNEXPECTED_BYTECODE                           -14
#define ONIGERR_MATCH_STACK_LIMIT_OVER                        -15
#define ONIGERR_DEFAULT_ENCODING_IS_NOT_SETTED                -21
#define ONIGERR_SPECIFIED_ENCODING_CANT_CONVERT_TO_WIDE_CHAR  -22

#define ONIGERR_INVALID_ARGUMENT                              -30
540
/* Error codes -100 .. -123. */
#define ONIGERR_END_PATTERN_AT_LEFT_BRACE                    -100
#define ONIGERR_END_PATTERN_AT_LEFT_BRACKET                  -101
#define ONIGERR_EMPTY_CHAR_CLASS                             -102
#define ONIGERR_PREMATURE_END_OF_CHAR_CLASS                  -103
#define ONIGERR_END_PATTERN_AT_ESCAPE                        -104
#define ONIGERR_END_PATTERN_AT_META                          -105
#define ONIGERR_END_PATTERN_AT_CONTROL                       -106
#define ONIGERR_META_CODE_SYNTAX                             -108
#define ONIGERR_CONTROL_CODE_SYNTAX                          -109
#define ONIGERR_CHAR_CLASS_VALUE_AT_END_OF_RANGE             -110
#define ONIGERR_CHAR_CLASS_VALUE_AT_START_OF_RANGE           -111
#define ONIGERR_UNMATCHED_RANGE_SPECIFIER_IN_CHAR_CLASS      -112
#define ONIGERR_TARGET_OF_REPEAT_OPERATOR_NOT_SPECIFIED      -113
#define ONIGERR_TARGET_OF_REPEAT_OPERATOR_INVALID            -114
#define ONIGERR_NESTED_REPEAT_OPERATOR                       -115
#define ONIGERR_UNMATCHED_CLOSE_PARENTHESIS                  -116
#define ONIGERR_END_PATTERN_WITH_UNMATCHED_PARENTHESIS       -117
#define ONIGERR_END_PATTERN_IN_GROUP                         -118
#define ONIGERR_UNDEFINED_GROUP_OPTION                       -119
#define ONIGERR_INVALID_POSIX_BRACKET_TYPE                   -121
#define ONIGERR_INVALID_LOOK_BEHIND_PATTERN                  -122
#define ONIGERR_INVALID_REPEAT_RANGE_PATTERN                 -123

/* Error codes -200 .. -223. */
#define ONIGERR_TOO_BIG_NUMBER                               -200
#define ONIGERR_TOO_BIG_NUMBER_FOR_REPEAT_RANGE              -201
#define ONIGERR_UPPER_SMALLER_THAN_LOWER_IN_REPEAT_RANGE     -202
#define ONIGERR_EMPTY_RANGE_IN_CHAR_CLASS                    -203
#define ONIGERR_MISMATCH_CODE_LENGTH_IN_CLASS_RANGE          -204
#define ONIGERR_TOO_MANY_MULTI_BYTE_RANGES                   -205
#define ONIGERR_TOO_SHORT_MULTI_BYTE_STRING                  -206
#define ONIGERR_TOO_BIG_BACKREF_NUMBER                       -207
#define ONIGERR_INVALID_BACKREF                              -208
#define ONIGERR_NUMBERED_BACKREF_OR_CALL_NOT_ALLOWED         -209
#define ONIGERR_TOO_LONG_WIDE_CHAR_VALUE                     -212
#define ONIGERR_EMPTY_GROUP_NAME                             -214
#define ONIGERR_INVALID_GROUP_NAME                           -215
#define ONIGERR_INVALID_CHAR_IN_GROUP_NAME                   -216
#define ONIGERR_UNDEFINED_NAME_REFERENCE                     -217
#define ONIGERR_UNDEFINED_GROUP_REFERENCE                    -218
#define ONIGERR_MULTIPLEX_DEFINED_NAME                       -219
#define ONIGERR_MULTIPLEX_DEFINITION_NAME_CALL               -220
#define ONIGERR_NEVER_ENDING_RECURSION                       -221
#define ONIGERR_GROUP_NUMBER_OVER_FOR_CAPTURE_HISTORY        -222
#define ONIGERR_INVALID_CHAR_PROPERTY_NAME                   -223

/* Error codes -400 .. -403; the first two names share the value -400. */
#define ONIGERR_INVALID_CODE_POINT_VALUE                     -400
#define ONIGERR_INVALID_WIDE_CHAR_VALUE                      -400
#define ONIGERR_TOO_BIG_WIDE_CHAR_VALUE                      -401
#define ONIGERR_NOT_SUPPORTED_ENCODING_COMBINATION           -402
#define ONIGERR_INVALID_COMBINATION_OF_OPTIONS               -403

/* Below -1000, so ONIG_IS_PATTERN_ERROR is false for this code. */
#define ONIGERR_OVER_THREAD_PASS_LIMIT_COUNT                -1001
593
594
595
#define ONIG_MAX_CAPTURE_HISTORY_GROUP   31
/*
 * Non-zero when i is at most ONIG_MAX_CAPTURE_HISTORY_GROUP and both
 * (r)->list and (r)->list[i] are non-null.  The index is only read after
 * the bound check passes.
 * NOTE(review): struct re_registers as declared in this header has no
 * "list" member, so this macro cannot be applied to an OnigRegion -- confirm
 * whether it is still in use.
 */
#define ONIG_IS_CAPTURE_HISTORY_GROUP(r, i)    \
  ((i) <= ONIG_MAX_CAPTURE_HISTORY_GROUP       \
   && (r)->list                                \
   && (r)->list[i])
599
/*
 * Node of a capture tree: a group number, a [beg, end] pair and an array
 * of child-node pointers.
 * NOTE(review): "allocated" presumably is the capacity of childs[] and
 * "num_childs" the number in use -- confirm against the implementation.
 */
struct OnigCaptureTreeNodeStruct {
  int  group;
  int  beg;
  int  end;
  int  allocated;
  int  num_childs;
  struct OnigCaptureTreeNodeStruct **childs;
};

typedef struct OnigCaptureTreeNodeStruct OnigCaptureTreeNode;
608
609
610 struct re_registers {
611 int allocated;
612 int num_regs;
613 int* beg;
614 int* end;
615
616 OnigCaptureTreeNode* history_root;
617 };
618
619
/* Traversal flags; AT_BOTH is the bitwise OR of the other two. */
#define ONIG_TRAVERSE_CALLBACK_AT_FIRST   1
#define ONIG_TRAVERSE_CALLBACK_AT_LAST    2
#define ONIG_TRAVERSE_CALLBACK_AT_BOTH \
  ( ONIG_TRAVERSE_CALLBACK_AT_FIRST | ONIG_TRAVERSE_CALLBACK_AT_LAST )

#define ONIG_REGION_NOTPOS               -1

/* Public name for struct re_registers. */
typedef struct re_registers   OnigRegion;
629
630 typedef struct {
631 OnigEncoding enc;
632 OnigUChar* par;
633 OnigUChar* par_end;
634 } OnigErrorInfo;
635
636 typedef struct {
637 int lower;
638 int upper;
639 } OnigRepeatRange;
640
641 typedef void (*OnigWarnFunc) P_((const char* s));
642 extern void onig_null_warn P_((const char* s));
643 #define ONIG_NULL_WARN onig_null_warn
644
/* Size of the byte map embedded in the regex object. */
#define ONIG_CHAR_TABLE_SIZE   256

/* Values of the regex object's "state" field. */
#define ONIG_STATE_NORMAL       0
#define ONIG_STATE_SEARCHING    1
#define ONIG_STATE_COMPILING   -1
#define ONIG_STATE_MODIFY      -2

/* Any positive state reads as SEARCHING; other values are returned as-is. */
#define ONIG_STATE(reg) \
  ((reg)->state > 0 ? ONIG_STATE_SEARCHING : (reg)->state)
655
656 typedef struct re_pattern_buffer {
657
658 unsigned char* p;
659 unsigned int used;
660 unsigned int alloc;
661
662 int state;
663 int num_mem;
664 int num_repeat;
665 int num_null_check;
666 int num_comb_exp_check;
667 int num_call;
668 unsigned int capture_history;
669 unsigned int bt_mem_start;
670 unsigned int bt_mem_end;
671 int stack_pop_level;
672 int repeat_range_alloc;
673 OnigRepeatRange* repeat_range;
674
675 OnigEncoding enc;
676 OnigOptionType options;
677 OnigSyntaxType* syntax;
678 OnigCaseFoldType case_fold_flag;
679 void* name_table;
680
681
682 int optimize;
683 int threshold_len;
684 int anchor;
685 OnigDistance anchor_dmin;
686 OnigDistance anchor_dmax;
687 int sub_anchor;
688 unsigned char *exact;
689 unsigned char *exact_end;
690 unsigned char map[ONIG_CHAR_TABLE_SIZE];
691 int *int_map;
692 int *int_map_backward;
693 OnigDistance dmin;
694 OnigDistance dmax;
695
696
697 struct re_pattern_buffer* chain;
698 } OnigRegexType;
699
700 typedef OnigRegexType* OnigRegex;
701
702 #ifndef ONIG_ESCAPE_REGEX_T_COLLISION
703 typedef OnigRegexType regex_t;
704 #endif
705
706
707 typedef struct {
708 int num_of_elements;
709 OnigEncoding pattern_enc;
710 OnigEncoding target_enc;
711 OnigSyntaxType* syntax;
712 OnigOptionType option;
713 OnigCaseFoldType case_fold_flag;
714 } OnigCompileInfo;
715
716
717 ONIG_EXTERN
718 int onig_init P_((void));
719 ONIG_EXTERN
720 int onig_error_code_to_str PV_((OnigUChar* s, int err_code, ...));
721 ONIG_EXTERN
722 void onig_set_warn_func P_((OnigWarnFunc f));
723 ONIG_EXTERN
724 void onig_set_verb_warn_func P_((OnigWarnFunc f));
725 ONIG_EXTERN
726 int onig_new P_((OnigRegex*, const OnigUChar* pattern, const OnigUChar* pattern_end, OnigOptionType option, OnigEncoding enc, OnigSyntaxType* syntax, OnigErrorInfo* einfo));
727 ONIG_EXTERN
728 int onig_reg_init P_((regex_t* reg, OnigOptionType option, OnigCaseFoldType case_fold_flag, OnigEncoding enc, OnigSyntaxType* syntax));
729 int onig_new_without_alloc P_((OnigRegex, const OnigUChar* pattern, const OnigUChar* pattern_end, OnigOptionType option, OnigEncoding enc, OnigSyntaxType* syntax, OnigErrorInfo* einfo));
730 ONIG_EXTERN
731 int onig_new_deluxe P_((OnigRegex* reg, const OnigUChar* pattern, const OnigUChar* pattern_end, OnigCompileInfo* ci, OnigErrorInfo* einfo));
732 ONIG_EXTERN
733 void onig_free P_((OnigRegex));
734 ONIG_EXTERN
735 void onig_free_body P_((OnigRegex));
736 ONIG_EXTERN
737 int onig_recompile P_((OnigRegex, const OnigUChar* pattern, const OnigUChar* pattern_end, OnigOptionType option, OnigEncoding enc, OnigSyntaxType* syntax, OnigErrorInfo* einfo));
738 ONIG_EXTERN
739 int onig_recompile_deluxe P_((OnigRegex reg, const OnigUChar* pattern, const OnigUChar* pattern_end, OnigCompileInfo* ci, OnigErrorInfo* einfo));
740 ONIG_EXTERN
741 int onig_search P_((OnigRegex, const OnigUChar* str, const OnigUChar* end, const OnigUChar* start, const OnigUChar* range, OnigRegion* region, OnigOptionType option));
742 ONIG_EXTERN
743 int onig_match P_((OnigRegex, const OnigUChar* str, const OnigUChar* end, const OnigUChar* at, OnigRegion* region, OnigOptionType option));
744 ONIG_EXTERN
745 OnigRegion* onig_region_new P_((void));
746 ONIG_EXTERN
747 void onig_region_init P_((OnigRegion* region));
748 ONIG_EXTERN
749 void onig_region_free P_((OnigRegion* region, int free_self));
750 ONIG_EXTERN
751 void onig_region_copy P_((OnigRegion* to, OnigRegion* from));
752 ONIG_EXTERN
753 void onig_region_clear P_((OnigRegion* region));
754 ONIG_EXTERN
755 int onig_region_resize P_((OnigRegion* region, int n));
756 ONIG_EXTERN
757 int onig_region_set P_((OnigRegion* region, int at, int beg, int end));
758 ONIG_EXTERN
759 int onig_name_to_group_numbers P_((OnigRegex reg, const OnigUChar* name, const OnigUChar* name_end, int** nums));
760 ONIG_EXTERN
761 int onig_name_to_backref_number P_((OnigRegex reg, const OnigUChar* name, const OnigUChar* name_end, OnigRegion *region));
762 ONIG_EXTERN
763 int onig_foreach_name P_((OnigRegex reg, int (*func)(const OnigUChar*, const OnigUChar*,int,int*,OnigRegex,void*), void* arg));
764 ONIG_EXTERN
765 int onig_number_of_names P_((OnigRegex reg));
766 ONIG_EXTERN
767 int onig_number_of_captures P_((OnigRegex reg));
768 ONIG_EXTERN
769 int onig_number_of_capture_histories P_((OnigRegex reg));
770 ONIG_EXTERN
771 OnigCaptureTreeNode* onig_get_capture_tree P_((OnigRegion* region));
772 ONIG_EXTERN
773 int onig_capture_tree_traverse P_((OnigRegion* region, int at, int(*callback_func)(int,int,int,int,int,void*), void* arg));
774 ONIG_EXTERN
775 int onig_noname_group_capture_is_active P_((OnigRegex reg));
776 ONIG_EXTERN
777 OnigEncoding onig_get_encoding P_((OnigRegex reg));
778 ONIG_EXTERN
779 OnigOptionType onig_get_options P_((OnigRegex reg));
780 ONIG_EXTERN
781 OnigCaseFoldType onig_get_case_fold_flag P_((OnigRegex reg));
782 ONIG_EXTERN
783 OnigSyntaxType* onig_get_syntax P_((OnigRegex reg));
784 ONIG_EXTERN
785 int onig_set_default_syntax P_((OnigSyntaxType* syntax));
786 ONIG_EXTERN
787 void onig_copy_syntax P_((OnigSyntaxType* to, OnigSyntaxType* from));
788 ONIG_EXTERN
789 unsigned int onig_get_syntax_op P_((OnigSyntaxType* syntax));
790 ONIG_EXTERN
791 unsigned int onig_get_syntax_op2 P_((OnigSyntaxType* syntax));
792 ONIG_EXTERN
793 unsigned int onig_get_syntax_behavior P_((OnigSyntaxType* syntax));
794 ONIG_EXTERN
795 OnigOptionType onig_get_syntax_options P_((OnigSyntaxType* syntax));
796 ONIG_EXTERN
797 void onig_set_syntax_op P_((OnigSyntaxType* syntax, unsigned int op));
798 ONIG_EXTERN
799 void onig_set_syntax_op2 P_((OnigSyntaxType* syntax, unsigned int op2));
800 ONIG_EXTERN
801 void onig_set_syntax_behavior P_((OnigSyntaxType* syntax, unsigned int behavior));
802 ONIG_EXTERN
803 void onig_set_syntax_options P_((OnigSyntaxType* syntax, OnigOptionType options));
804 ONIG_EXTERN
805 int onig_set_meta_char P_((OnigSyntaxType* syntax, unsigned int what, OnigCodePoint code));
806 ONIG_EXTERN
807 void onig_copy_encoding P_((OnigEncoding to, OnigEncoding from));
808 ONIG_EXTERN
809 OnigCaseFoldType onig_get_default_case_fold_flag P_((void));
810 ONIG_EXTERN
811 int onig_set_default_case_fold_flag P_((OnigCaseFoldType case_fold_flag));
812 ONIG_EXTERN
813 unsigned int onig_get_match_stack_limit_size P_((void));
814 ONIG_EXTERN
815 int onig_set_match_stack_limit_size P_((unsigned int size));
816 ONIG_EXTERN
817 int onig_end P_((void));
818 ONIG_EXTERN
819 const char* onig_version P_((void));
820 ONIG_EXTERN
821 const char* onig_copyright P_((void));
822
823 #ifdef __cplusplus
824 }
825 #endif
826
827 #endif