ferroni 1.0.0

Pure-Rust Oniguruma regex engine with SIMD-accelerated search
Documentation
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
// oniguruma.rs - Port of oniguruma.h
// Public types, option flags, error codes, syntax flags, structs.

// === Version ===
/// Major component of the version number.
pub const ONIGURUMA_VERSION_MAJOR: i32 = 6;
/// Minor component of the version number.
pub const ONIGURUMA_VERSION_MINOR: i32 = 9;
/// Teeny (patch) component of the version number.
pub const ONIGURUMA_VERSION_TEENY: i32 = 10;
/// Whole version packed into one integer as
/// `major * 10000 + minor * 100 + teeny` (evaluates to `60910`).
pub const ONIGURUMA_VERSION_INT: i32 =
    ONIGURUMA_VERSION_MAJOR * 10_000 + ONIGURUMA_VERSION_MINOR * 100 + ONIGURUMA_VERSION_TEENY;

// === Basic types ===
/// Character code point value (`u32`).
pub type OnigCodePoint = u32;
/// Single unsigned byte (`u8`).
pub type OnigUChar = u8;
/// Character-type value (`u32`).
/// NOTE(review): presumably holds the `ONIGENC_CTYPE_*` ids declared in this file — confirm.
pub type OnigCtype = u32;
/// Length / distance value (`u32`); `ONIG_INFINITE_DISTANCE` is its maximum.
pub type OnigLen = u32;
/// Flag word for the `ONIGENC_CASE_FOLD_*` constants (`u32`).
pub type OnigCaseFoldType = u32;

// OnigOptionType is a bitflags struct over `u32` rather than a raw u32 alias.
// The bitwise operators (|, &, !, |=, &=) are still available on it.
//
// Bit layout, as declared below: bits 0-12 and 15-26 are assigned;
// bits 13 and 14 are not assigned to any flag.
bitflags::bitflags! {
    #[derive(Debug, Clone, Copy, PartialEq, Eq, Hash)]
    pub struct OnigOptionType: u32 {
        // Empty set: no bit is set.
        const NONE              = 0;
        const IGNORECASE        = 1;
        const EXTEND            = 1 << 1;
        const MULTILINE         = 1 << 2;
        const SINGLELINE        = 1 << 3;
        const FIND_LONGEST      = 1 << 4;
        const FIND_NOT_EMPTY    = 1 << 5;
        const NEGATE_SINGLELINE = 1 << 6;
        const DONT_CAPTURE_GROUP = 1 << 7;
        const CAPTURE_GROUP     = 1 << 8;
        // search time
        const NOTBOL            = 1 << 9;
        const NOTEOL            = 1 << 10;
        const POSIX_REGION      = 1 << 11;
        const CHECK_VALIDITY_OF_STRING = 1 << 12;
        // compile time (continued; bits 13 and 14 are skipped)
        const IGNORECASE_IS_ASCII = 1 << 15;
        const WORD_IS_ASCII     = 1 << 16;
        const DIGIT_IS_ASCII    = 1 << 17;
        const SPACE_IS_ASCII    = 1 << 18;
        const POSIX_IS_ASCII    = 1 << 19;
        const TEXT_SEGMENT_EXTENDED_GRAPHEME_CLUSTER = 1 << 20;
        const TEXT_SEGMENT_WORD = 1 << 21;
        // search time (continued)
        const NOT_BEGIN_STRING  = 1 << 22;
        const NOT_END_STRING    = 1 << 23;
        const NOT_BEGIN_POSITION = 1 << 24;
        const CALLBACK_EACH_MATCH = 1 << 25;
        // Highest bit assigned in this set.
        const MATCH_WHOLE_STRING = 1 << 26;
    }
}

// === Constants ===
/// Largest representable `OnigLen`; going by the name, it stands for an
/// unbounded distance.
pub const ONIG_INFINITE_DISTANCE: OnigLen = OnigLen::MAX;

// === Case Fold Flags ===
// Single-bit values of type `OnigCaseFoldType`.
/// Bit 0.
pub const ONIGENC_CASE_FOLD_ASCII_ONLY: OnigCaseFoldType = 1;
/// Bit 20.
pub const ONIGENC_CASE_FOLD_TURKISH_AZERI: OnigCaseFoldType = 1 << 20;
/// Bit 30.
pub const INTERNAL_ONIGENC_CASE_FOLD_MULTI_CHAR: OnigCaseFoldType = 1 << 30;
/// Same value as [`INTERNAL_ONIGENC_CASE_FOLD_MULTI_CHAR`].
pub const ONIGENC_CASE_FOLD_MIN: OnigCaseFoldType = INTERNAL_ONIGENC_CASE_FOLD_MULTI_CHAR;

// === Work Size ===
// Fixed sizes (all `usize`) for case-fold and encoding work buffers.
/// Length of the `code` array in `OnigCaseFoldCodeItem`.
pub const ONIGENC_MAX_COMP_CASE_FOLD_CODE_LEN: usize = 3;
/// NOTE(review): presumably the maximum number of case-fold items returned per lookup — confirm.
pub const ONIGENC_GET_CASE_FOLD_CODES_MAX_NUM: usize = 13;
/// NOTE(review): presumably the maximum byte length when encoding one code point — confirm.
pub const ONIGENC_CODE_TO_MBC_MAXLEN: usize = 7;
/// NOTE(review): presumably the maximum byte length of a case-folded character — confirm.
pub const ONIGENC_MBC_CASE_FOLD_MAXLEN: usize = 18;

// === Character Types ===
// Consecutive character-type ids, 0 through 14. These are plain ordinals,
// not bit masks.
pub const ONIGENC_CTYPE_NEWLINE: u32 = 0;
pub const ONIGENC_CTYPE_ALPHA: u32 = 1;
pub const ONIGENC_CTYPE_BLANK: u32 = 2;
pub const ONIGENC_CTYPE_CNTRL: u32 = 3;
pub const ONIGENC_CTYPE_DIGIT: u32 = 4;
pub const ONIGENC_CTYPE_GRAPH: u32 = 5;
pub const ONIGENC_CTYPE_LOWER: u32 = 6;
pub const ONIGENC_CTYPE_PRINT: u32 = 7;
pub const ONIGENC_CTYPE_PUNCT: u32 = 8;
pub const ONIGENC_CTYPE_SPACE: u32 = 9;
pub const ONIGENC_CTYPE_UPPER: u32 = 10;
pub const ONIGENC_CTYPE_XDIGIT: u32 = 11;
pub const ONIGENC_CTYPE_WORD: u32 = 12;
pub const ONIGENC_CTYPE_ALNUM: u32 = 13;
pub const ONIGENC_CTYPE_ASCII: u32 = 14;
/// Highest id in the list above (equal to `ONIGENC_CTYPE_ASCII`).
pub const ONIGENC_MAX_STD_CTYPE: u32 = ONIGENC_CTYPE_ASCII;

// === Case Fold Code Item ===
/// One case-fold entry: two lengths plus a fixed-size code point array.
#[derive(Clone, Debug)]
pub struct OnigCaseFoldCodeItem {
    /// NOTE(review): presumably the byte length of the matched text — confirm.
    pub byte_len: i32,
    /// NOTE(review): presumably the number of used entries in `code` — confirm.
    pub code_len: i32,
    /// Storage for up to `ONIGENC_MAX_COMP_CASE_FOLD_CODE_LEN` code points.
    pub code: [OnigCodePoint; ONIGENC_MAX_COMP_CASE_FOLD_CODE_LEN],
}

// === Meta Char Table ===
/// Table with one code point per meta-character role.
/// The field order matches the numbering of the `ONIG_META_CHAR_*`
/// constants in this file (escape = 0 ... anychar_anytime = 5).
#[derive(Clone, Debug)]
pub struct OnigMetaCharTableType {
    pub esc: OnigCodePoint,
    pub anychar: OnigCodePoint,
    pub anytime: OnigCodePoint,
    pub zero_or_one_time: OnigCodePoint,
    pub one_or_more_time: OnigCodePoint,
    pub anychar_anytime: OnigCodePoint,
}

// === Config Parameters ===
// Fixed limits. Their exact use is not visible in this file; the notes
// below go by the names only.
/// NOTE(review): presumably a region slot count — confirm against callers.
pub const ONIG_NREGION: usize = 10;
/// Equal to `i32::MAX`.
pub const ONIG_MAX_CAPTURE_NUM: i32 = 2147483647;
pub const ONIG_MAX_BACKREF_NUM: i32 = 1000;
pub const ONIG_MAX_REPEAT_NUM: i32 = 100000;
pub const ONIG_MAX_MULTI_BYTE_RANGES_NUM: i32 = 10000;
pub const ONIG_MAX_ERROR_MESSAGE_LEN: usize = 90;

// === Option Flag Aliases ===
// These provide the original C constant names for backward compatibility.
// Each constant is the `OnigOptionType` flag of the same name.
/// Default option set: identical to `ONIG_OPTION_NONE` (no flag set).
pub const ONIG_OPTION_DEFAULT: OnigOptionType = OnigOptionType::NONE;
pub const ONIG_OPTION_NONE: OnigOptionType = OnigOptionType::NONE;
pub const ONIG_OPTION_IGNORECASE: OnigOptionType = OnigOptionType::IGNORECASE;
pub const ONIG_OPTION_EXTEND: OnigOptionType = OnigOptionType::EXTEND;
pub const ONIG_OPTION_MULTILINE: OnigOptionType = OnigOptionType::MULTILINE;
pub const ONIG_OPTION_SINGLELINE: OnigOptionType = OnigOptionType::SINGLELINE;
pub const ONIG_OPTION_FIND_LONGEST: OnigOptionType = OnigOptionType::FIND_LONGEST;
pub const ONIG_OPTION_FIND_NOT_EMPTY: OnigOptionType = OnigOptionType::FIND_NOT_EMPTY;
pub const ONIG_OPTION_NEGATE_SINGLELINE: OnigOptionType = OnigOptionType::NEGATE_SINGLELINE;
pub const ONIG_OPTION_DONT_CAPTURE_GROUP: OnigOptionType = OnigOptionType::DONT_CAPTURE_GROUP;
pub const ONIG_OPTION_CAPTURE_GROUP: OnigOptionType = OnigOptionType::CAPTURE_GROUP;
pub const ONIG_OPTION_NOTBOL: OnigOptionType = OnigOptionType::NOTBOL;
pub const ONIG_OPTION_NOTEOL: OnigOptionType = OnigOptionType::NOTEOL;
pub const ONIG_OPTION_POSIX_REGION: OnigOptionType = OnigOptionType::POSIX_REGION;
pub const ONIG_OPTION_CHECK_VALIDITY_OF_STRING: OnigOptionType = OnigOptionType::CHECK_VALIDITY_OF_STRING;
pub const ONIG_OPTION_IGNORECASE_IS_ASCII: OnigOptionType = OnigOptionType::IGNORECASE_IS_ASCII;
pub const ONIG_OPTION_WORD_IS_ASCII: OnigOptionType = OnigOptionType::WORD_IS_ASCII;
pub const ONIG_OPTION_DIGIT_IS_ASCII: OnigOptionType = OnigOptionType::DIGIT_IS_ASCII;
pub const ONIG_OPTION_SPACE_IS_ASCII: OnigOptionType = OnigOptionType::SPACE_IS_ASCII;
pub const ONIG_OPTION_POSIX_IS_ASCII: OnigOptionType = OnigOptionType::POSIX_IS_ASCII;
pub const ONIG_OPTION_TEXT_SEGMENT_EXTENDED_GRAPHEME_CLUSTER: OnigOptionType =
    OnigOptionType::TEXT_SEGMENT_EXTENDED_GRAPHEME_CLUSTER;
pub const ONIG_OPTION_TEXT_SEGMENT_WORD: OnigOptionType = OnigOptionType::TEXT_SEGMENT_WORD;
pub const ONIG_OPTION_NOT_BEGIN_STRING: OnigOptionType = OnigOptionType::NOT_BEGIN_STRING;
pub const ONIG_OPTION_NOT_END_STRING: OnigOptionType = OnigOptionType::NOT_END_STRING;
pub const ONIG_OPTION_NOT_BEGIN_POSITION: OnigOptionType = OnigOptionType::NOT_BEGIN_POSITION;
pub const ONIG_OPTION_CALLBACK_EACH_MATCH: OnigOptionType = OnigOptionType::CALLBACK_EACH_MATCH;
pub const ONIG_OPTION_MATCH_WHOLE_STRING: OnigOptionType = OnigOptionType::MATCH_WHOLE_STRING;

/// The option occupying the highest assigned bit (`MATCH_WHOLE_STRING`, bit 26).
pub const ONIG_OPTION_MAXBIT: OnigOptionType = OnigOptionType::MATCH_WHOLE_STRING;

/// Turns on every flag of `regopt` in `options`; other flags are left as they are.
#[inline]
pub fn onig_option_on(options: &mut OnigOptionType, regopt: OnigOptionType) {
    *options = options.union(regopt);
}

/// Turns off every flag of `regopt` in `options`; other flags are left as they are.
#[inline]
pub fn onig_option_off(options: &mut OnigOptionType, regopt: OnigOptionType) {
    *options = options.difference(regopt);
}

/// Returns `true` when every flag of `option` is set in `options`.
/// An empty `option` is therefore always reported as on.
#[inline]
pub fn onig_is_option_on(options: OnigOptionType, option: OnigOptionType) -> bool {
    let shared = options.intersection(option);
    shared == option
}

// === Syntax Type ===
/// Syntax description: three `u32` flag words, an option set and a
/// meta-character table.
#[derive(Clone, Debug)]
pub struct OnigSyntaxType {
    /// Flag word tested by `is_syntax_op` (`ONIG_SYN_OP_*` masks).
    pub op: u32,
    /// Flag word tested by `is_syntax_op2` (`ONIG_SYN_OP2_*` masks).
    pub op2: u32,
    /// Flag word tested by `is_syntax_bv` (behavior masks).
    pub behavior: u32,
    /// Option flags carried by this syntax.
    pub options: OnigOptionType,
    /// Meta-character code points for this syntax.
    pub meta_char_table: OnigMetaCharTableType,
}

// === Syntax Operator Flags (op) ===
// Single-bit masks for `OnigSyntaxType::op`; all 32 bits (0-31) are assigned.
pub const ONIG_SYN_OP_VARIABLE_META_CHARACTERS: u32 = 1 << 0;
pub const ONIG_SYN_OP_DOT_ANYCHAR: u32 = 1 << 1;
pub const ONIG_SYN_OP_ASTERISK_ZERO_INF: u32 = 1 << 2;
pub const ONIG_SYN_OP_ESC_ASTERISK_ZERO_INF: u32 = 1 << 3;
pub const ONIG_SYN_OP_PLUS_ONE_INF: u32 = 1 << 4;
pub const ONIG_SYN_OP_ESC_PLUS_ONE_INF: u32 = 1 << 5;
pub const ONIG_SYN_OP_QMARK_ZERO_ONE: u32 = 1 << 6;
pub const ONIG_SYN_OP_ESC_QMARK_ZERO_ONE: u32 = 1 << 7;
pub const ONIG_SYN_OP_BRACE_INTERVAL: u32 = 1 << 8;
pub const ONIG_SYN_OP_ESC_BRACE_INTERVAL: u32 = 1 << 9;
pub const ONIG_SYN_OP_VBAR_ALT: u32 = 1 << 10;
pub const ONIG_SYN_OP_ESC_VBAR_ALT: u32 = 1 << 11;
pub const ONIG_SYN_OP_LPAREN_SUBEXP: u32 = 1 << 12;
pub const ONIG_SYN_OP_ESC_LPAREN_SUBEXP: u32 = 1 << 13;
pub const ONIG_SYN_OP_ESC_AZ_BUF_ANCHOR: u32 = 1 << 14;
pub const ONIG_SYN_OP_ESC_CAPITAL_G_BEGIN_ANCHOR: u32 = 1 << 15;
pub const ONIG_SYN_OP_DECIMAL_BACKREF: u32 = 1 << 16;
pub const ONIG_SYN_OP_BRACKET_CC: u32 = 1 << 17;
pub const ONIG_SYN_OP_ESC_W_WORD: u32 = 1 << 18;
pub const ONIG_SYN_OP_ESC_LTGT_WORD_BEGIN_END: u32 = 1 << 19;
pub const ONIG_SYN_OP_ESC_B_WORD_BOUND: u32 = 1 << 20;
pub const ONIG_SYN_OP_ESC_S_WHITE_SPACE: u32 = 1 << 21;
pub const ONIG_SYN_OP_ESC_D_DIGIT: u32 = 1 << 22;
pub const ONIG_SYN_OP_LINE_ANCHOR: u32 = 1 << 23;
pub const ONIG_SYN_OP_POSIX_BRACKET: u32 = 1 << 24;
pub const ONIG_SYN_OP_QMARK_NON_GREEDY: u32 = 1 << 25;
pub const ONIG_SYN_OP_ESC_CONTROL_CHARS: u32 = 1 << 26;
pub const ONIG_SYN_OP_ESC_C_CONTROL: u32 = 1 << 27;
pub const ONIG_SYN_OP_ESC_OCTAL3: u32 = 1 << 28;
pub const ONIG_SYN_OP_ESC_X_HEX2: u32 = 1 << 29;
pub const ONIG_SYN_OP_ESC_X_BRACE_HEX8: u32 = 1 << 30;
pub const ONIG_SYN_OP_ESC_O_BRACE_OCTAL: u32 = 1 << 31;

// === Syntax Operator Flags (op2) ===
// Single-bit masks for `OnigSyntaxType::op2`. Bit 18 is not assigned.
pub const ONIG_SYN_OP2_ESC_CAPITAL_Q_QUOTE: u32 = 1 << 0;
pub const ONIG_SYN_OP2_QMARK_GROUP_EFFECT: u32 = 1 << 1;
pub const ONIG_SYN_OP2_OPTION_PERL: u32 = 1 << 2;
pub const ONIG_SYN_OP2_OPTION_RUBY: u32 = 1 << 3;
pub const ONIG_SYN_OP2_PLUS_POSSESSIVE_REPEAT: u32 = 1 << 4;
pub const ONIG_SYN_OP2_PLUS_POSSESSIVE_INTERVAL: u32 = 1 << 5;
pub const ONIG_SYN_OP2_CCLASS_SET_OP: u32 = 1 << 6;
pub const ONIG_SYN_OP2_QMARK_LT_NAMED_GROUP: u32 = 1 << 7;
pub const ONIG_SYN_OP2_ESC_K_NAMED_BACKREF: u32 = 1 << 8;
pub const ONIG_SYN_OP2_ESC_G_SUBEXP_CALL: u32 = 1 << 9;
pub const ONIG_SYN_OP2_ATMARK_CAPTURE_HISTORY: u32 = 1 << 10;
pub const ONIG_SYN_OP2_ESC_CAPITAL_C_BAR_CONTROL: u32 = 1 << 11;
pub const ONIG_SYN_OP2_ESC_CAPITAL_M_BAR_META: u32 = 1 << 12;
pub const ONIG_SYN_OP2_ESC_V_VTAB: u32 = 1 << 13;
pub const ONIG_SYN_OP2_ESC_U_HEX4: u32 = 1 << 14;
pub const ONIG_SYN_OP2_ESC_GNU_BUF_ANCHOR: u32 = 1 << 15;
pub const ONIG_SYN_OP2_ESC_P_BRACE_CHAR_PROPERTY: u32 = 1 << 16;
pub const ONIG_SYN_OP2_ESC_P_BRACE_CIRCUMFLEX_NOT: u32 = 1 << 17;
// (bit 18 intentionally skipped in this list)
pub const ONIG_SYN_OP2_ESC_H_XDIGIT: u32 = 1 << 19;
pub const ONIG_SYN_OP2_INEFFECTIVE_ESCAPE: u32 = 1 << 20;
pub const ONIG_SYN_OP2_QMARK_LPAREN_IF_ELSE: u32 = 1 << 21;
pub const ONIG_SYN_OP2_ESC_CAPITAL_K_KEEP: u32 = 1 << 22;
pub const ONIG_SYN_OP2_ESC_CAPITAL_R_GENERAL_NEWLINE: u32 = 1 << 23;
pub const ONIG_SYN_OP2_ESC_CAPITAL_N_O_SUPER_DOT: u32 = 1 << 24;
pub const ONIG_SYN_OP2_QMARK_TILDE_ABSENT_GROUP: u32 = 1 << 25;
pub const ONIG_SYN_OP2_ESC_X_Y_TEXT_SEGMENT: u32 = 1 << 26;
pub const ONIG_SYN_OP2_QMARK_PERL_SUBEXP_CALL: u32 = 1 << 27;
pub const ONIG_SYN_OP2_QMARK_BRACE_CALLOUT_CONTENTS: u32 = 1 << 28;
pub const ONIG_SYN_OP2_ASTERISK_CALLOUT_NAME: u32 = 1 << 29;
pub const ONIG_SYN_OP2_OPTION_ONIGURUMA: u32 = 1 << 30;
pub const ONIG_SYN_OP2_QMARK_CAPITAL_P_NAME: u32 = 1 << 31;

// === Syntax Behavior Flags ===
// Single-bit masks for `OnigSyntaxType::behavior`.
// Bits 16-19 and 28-30 are not assigned.
pub const ONIG_SYN_CONTEXT_INDEP_REPEAT_OPS: u32 = 1 << 0;
pub const ONIG_SYN_CONTEXT_INVALID_REPEAT_OPS: u32 = 1 << 1;
pub const ONIG_SYN_ALLOW_UNMATCHED_CLOSE_SUBEXP: u32 = 1 << 2;
pub const ONIG_SYN_ALLOW_INVALID_INTERVAL: u32 = 1 << 3;
pub const ONIG_SYN_ALLOW_INTERVAL_LOW_ABBREV: u32 = 1 << 4;
pub const ONIG_SYN_STRICT_CHECK_BACKREF: u32 = 1 << 5;
pub const ONIG_SYN_DIFFERENT_LEN_ALT_LOOK_BEHIND: u32 = 1 << 6;
pub const ONIG_SYN_CAPTURE_ONLY_NAMED_GROUP: u32 = 1 << 7;
pub const ONIG_SYN_ALLOW_MULTIPLEX_DEFINITION_NAME: u32 = 1 << 8;
pub const ONIG_SYN_FIXED_INTERVAL_IS_GREEDY_ONLY: u32 = 1 << 9;
pub const ONIG_SYN_ISOLATED_OPTION_CONTINUE_BRANCH: u32 = 1 << 10;
pub const ONIG_SYN_VARIABLE_LEN_LOOK_BEHIND: u32 = 1 << 11;
pub const ONIG_SYN_PYTHON: u32 = 1 << 12;
pub const ONIG_SYN_WHOLE_OPTIONS: u32 = 1 << 13;
pub const ONIG_SYN_BRE_ANCHOR_AT_EDGE_OF_SUBEXP: u32 = 1 << 14;
pub const ONIG_SYN_ESC_P_WITH_ONE_CHAR_PROP: u32 = 1 << 15;
// in char class [...]
pub const ONIG_SYN_NOT_NEWLINE_IN_NEGATIVE_CC: u32 = 1 << 20;
pub const ONIG_SYN_BACKSLASH_ESCAPE_IN_CC: u32 = 1 << 21;
pub const ONIG_SYN_ALLOW_EMPTY_RANGE_IN_CC: u32 = 1 << 22;
pub const ONIG_SYN_ALLOW_DOUBLE_RANGE_OP_IN_CC: u32 = 1 << 23;
pub const ONIG_SYN_WARN_CC_OP_NOT_ESCAPED: u32 = 1 << 24;
pub const ONIG_SYN_WARN_REDUNDANT_NESTED_REPEAT: u32 = 1 << 25;
pub const ONIG_SYN_ALLOW_INVALID_CODE_END_OF_RANGE_IN_CC: u32 = 1 << 26;
pub const ONIG_SYN_ALLOW_CHAR_TYPE_FOLLOWED_BY_MINUS_IN_CC: u32 = 1 << 27;
// top bit of the word
pub const ONIG_SYN_CONTEXT_INDEP_ANCHORS: u32 = 1 << 31;

// === Meta Char Specifiers ===
// Ordinals 0-5, in the same order as the fields of `OnigMetaCharTableType`.
pub const ONIG_META_CHAR_ESCAPE: u32 = 0;
pub const ONIG_META_CHAR_ANYCHAR: u32 = 1;
pub const ONIG_META_CHAR_ANYTIME: u32 = 2;
pub const ONIG_META_CHAR_ZERO_OR_ONE_TIME: u32 = 3;
pub const ONIG_META_CHAR_ONE_OR_MORE_TIME: u32 = 4;
pub const ONIG_META_CHAR_ANYCHAR_ANYTIME: u32 = 5;
/// Code point value 0.
/// NOTE(review): by its name, marks a meta-character slot as disabled — confirm.
pub const ONIG_INEFFECTIVE_META_CHAR: OnigCodePoint = 0;

// === Error Codes ===
// All codes are `i32`. Values at or below -100 (and above -1000) are the
// ones `onig_is_pattern_error` reports as pattern errors.
// normal return
pub const ONIG_NORMAL: i32 = 0;
pub const ONIG_VALUE_IS_NOT_SET: i32 = 1;
pub const ONIG_MISMATCH: i32 = -1;
pub const ONIG_NO_SUPPORT_CONFIG: i32 = -2;
pub const ONIG_ABORT: i32 = -3;

// internal error
pub const ONIGERR_MEMORY: i32 = -5;
pub const ONIGERR_TYPE_BUG: i32 = -6;
pub const ONIGERR_PARSER_BUG: i32 = -11;
pub const ONIGERR_STACK_BUG: i32 = -12;
pub const ONIGERR_UNDEFINED_BYTECODE: i32 = -13;
pub const ONIGERR_UNEXPECTED_BYTECODE: i32 = -14;
pub const ONIGERR_MATCH_STACK_LIMIT_OVER: i32 = -15;
pub const ONIGERR_PARSE_DEPTH_LIMIT_OVER: i32 = -16;
pub const ONIGERR_RETRY_LIMIT_IN_MATCH_OVER: i32 = -17;
pub const ONIGERR_RETRY_LIMIT_IN_SEARCH_OVER: i32 = -18;
pub const ONIGERR_SUBEXP_CALL_LIMIT_IN_SEARCH_OVER: i32 = -19;
pub const ONIGERR_TIME_LIMIT_OVER: i32 = -20;
pub const ONIGERR_DEFAULT_ENCODING_IS_NOT_SET: i32 = -21;
pub const ONIGERR_SPECIFIED_ENCODING_CANT_CONVERT_TO_WIDE_CHAR: i32 = -22;
pub const ONIGERR_FAIL_TO_INITIALIZE: i32 = -23;

// general error
pub const ONIGERR_INVALID_ARGUMENT: i32 = -30;

// syntax error (-107 is not assigned)
pub const ONIGERR_END_PATTERN_AT_LEFT_BRACE: i32 = -100;
pub const ONIGERR_END_PATTERN_AT_LEFT_BRACKET: i32 = -101;
pub const ONIGERR_EMPTY_CHAR_CLASS: i32 = -102;
pub const ONIGERR_PREMATURE_END_OF_CHAR_CLASS: i32 = -103;
pub const ONIGERR_END_PATTERN_AT_ESCAPE: i32 = -104;
pub const ONIGERR_END_PATTERN_AT_META: i32 = -105;
pub const ONIGERR_END_PATTERN_AT_CONTROL: i32 = -106;
pub const ONIGERR_META_CODE_SYNTAX: i32 = -108;
pub const ONIGERR_CONTROL_CODE_SYNTAX: i32 = -109;
pub const ONIGERR_CHAR_CLASS_VALUE_AT_END_OF_RANGE: i32 = -110;
pub const ONIGERR_CHAR_CLASS_VALUE_AT_START_OF_RANGE: i32 = -111;
pub const ONIGERR_UNMATCHED_RANGE_SPECIFIER_IN_CHAR_CLASS: i32 = -112;
pub const ONIGERR_TARGET_OF_REPEAT_OPERATOR_NOT_SPECIFIED: i32 = -113;
pub const ONIGERR_TARGET_OF_REPEAT_OPERATOR_INVALID: i32 = -114;
pub const ONIGERR_NESTED_REPEAT_OPERATOR: i32 = -115;
pub const ONIGERR_UNMATCHED_CLOSE_PARENTHESIS: i32 = -116;
pub const ONIGERR_END_PATTERN_WITH_UNMATCHED_PARENTHESIS: i32 = -117;
pub const ONIGERR_END_PATTERN_IN_GROUP: i32 = -118;
pub const ONIGERR_UNDEFINED_GROUP_OPTION: i32 = -119;
pub const ONIGERR_INVALID_GROUP_OPTION: i32 = -120;
pub const ONIGERR_INVALID_POSIX_BRACKET_TYPE: i32 = -121;
pub const ONIGERR_INVALID_LOOK_BEHIND_PATTERN: i32 = -122;
pub const ONIGERR_INVALID_REPEAT_RANGE_PATTERN: i32 = -123;

// values error (syntax error) (-211 is not assigned)
pub const ONIGERR_TOO_BIG_NUMBER: i32 = -200;
pub const ONIGERR_TOO_BIG_NUMBER_FOR_REPEAT_RANGE: i32 = -201;
pub const ONIGERR_UPPER_SMALLER_THAN_LOWER_IN_REPEAT_RANGE: i32 = -202;
pub const ONIGERR_EMPTY_RANGE_IN_CHAR_CLASS: i32 = -203;
pub const ONIGERR_MISMATCH_CODE_LENGTH_IN_CLASS_RANGE: i32 = -204;
pub const ONIGERR_TOO_MANY_MULTI_BYTE_RANGES: i32 = -205;
pub const ONIGERR_TOO_SHORT_MULTI_BYTE_STRING: i32 = -206;
pub const ONIGERR_TOO_BIG_BACKREF_NUMBER: i32 = -207;
pub const ONIGERR_INVALID_BACKREF: i32 = -208;
pub const ONIGERR_NUMBERED_BACKREF_OR_CALL_NOT_ALLOWED: i32 = -209;
pub const ONIGERR_TOO_MANY_CAPTURES: i32 = -210;
pub const ONIGERR_TOO_LONG_WIDE_CHAR_VALUE: i32 = -212;
pub const ONIGERR_UNDEFINED_OPERATOR: i32 = -213;
pub const ONIGERR_EMPTY_GROUP_NAME: i32 = -214;
pub const ONIGERR_INVALID_GROUP_NAME: i32 = -215;
pub const ONIGERR_INVALID_CHAR_IN_GROUP_NAME: i32 = -216;
pub const ONIGERR_UNDEFINED_NAME_REFERENCE: i32 = -217;
pub const ONIGERR_UNDEFINED_GROUP_REFERENCE: i32 = -218;
pub const ONIGERR_MULTIPLEX_DEFINED_NAME: i32 = -219;
pub const ONIGERR_MULTIPLEX_DEFINITION_NAME_CALL: i32 = -220;
pub const ONIGERR_NEVER_ENDING_RECURSION: i32 = -221;
pub const ONIGERR_GROUP_NUMBER_OVER_FOR_CAPTURE_HISTORY: i32 = -222;
pub const ONIGERR_INVALID_CHAR_PROPERTY_NAME: i32 = -223;
pub const ONIGERR_INVALID_IF_ELSE_SYNTAX: i32 = -224;
pub const ONIGERR_INVALID_ABSENT_GROUP_PATTERN: i32 = -225;
pub const ONIGERR_INVALID_ABSENT_GROUP_GENERATOR_PATTERN: i32 = -226;
pub const ONIGERR_INVALID_CALLOUT_PATTERN: i32 = -227;
pub const ONIGERR_INVALID_CALLOUT_NAME: i32 = -228;
pub const ONIGERR_UNDEFINED_CALLOUT_NAME: i32 = -229;
pub const ONIGERR_INVALID_CALLOUT_BODY: i32 = -230;
pub const ONIGERR_INVALID_CALLOUT_TAG_NAME: i32 = -231;
pub const ONIGERR_INVALID_CALLOUT_ARG: i32 = -232;
// -400 block; the next two names share the same value (-400)
pub const ONIGERR_INVALID_CODE_POINT_VALUE: i32 = -400;
pub const ONIGERR_INVALID_WIDE_CHAR_VALUE: i32 = -400;
pub const ONIGERR_TOO_BIG_WIDE_CHAR_VALUE: i32 = -401;
pub const ONIGERR_NOT_SUPPORTED_ENCODING_COMBINATION: i32 = -402;
pub const ONIGERR_INVALID_COMBINATION_OF_OPTIONS: i32 = -403;
pub const ONIGERR_TOO_MANY_USER_DEFINED_OBJECTS: i32 = -404;
pub const ONIGERR_TOO_LONG_PROPERTY_NAME: i32 = -405;
pub const ONIGERR_VERY_INEFFICIENT_PATTERN: i32 = -406;
pub const ONIGERR_LIBRARY_IS_NOT_INITIALIZED: i32 = -500;

/// Reports whether `ecode` lies in the pattern-error band, i.e.
/// `-999 ..= -100` (both ends included).
#[inline]
#[cfg_attr(coverage_nightly, coverage(off))]
pub fn onig_is_pattern_error(ecode: i32) -> bool {
    (-999..=-100).contains(&ecode)
}

// === Capture History ===
/// NOTE(review): presumably the highest group number usable with capture
/// history (see `ONIGERR_GROUP_NUMBER_OVER_FOR_CAPTURE_HISTORY`) — confirm.
pub const ONIG_MAX_CAPTURE_HISTORY_GROUP: usize = 31;

// === Capture Tree Node ===
/// Node of a capture tree: a group number, a begin/end pair and owned children.
#[derive(Clone)]
pub struct OnigCaptureTreeNode {
    /// Group number; `-1` in a freshly created or cleared node.
    pub group: i32,
    /// Begin position; `ONIG_REGION_NOTPOS` in a fresh or cleared node.
    pub beg: i32,
    /// End position; `ONIG_REGION_NOTPOS` in a fresh or cleared node.
    pub end: i32,
    /// Child nodes, in insertion order.
    pub childs: Vec<Box<OnigCaptureTreeNode>>,
}

impl OnigCaptureTreeNode {
    /// Builds a node with no group (`-1`), unset positions
    /// (`ONIG_REGION_NOTPOS`) and no children.
    pub fn new() -> Self {
        let unset = ONIG_REGION_NOTPOS;
        Self {
            group: -1,
            beg: unset,
            end: unset,
            childs: Vec::new(),
        }
    }

    /// Puts the node back into the state produced by [`Self::new`]:
    /// children are dropped and group/positions are reset.
    #[cfg_attr(coverage_nightly, coverage(off))]
    pub fn clear(&mut self) {
        self.group = -1;
        self.beg = ONIG_REGION_NOTPOS;
        self.end = ONIG_REGION_NOTPOS;
        self.childs.clear();
    }

    /// Appends `child` after the existing children.
    pub fn add_child(&mut self, child: Box<OnigCaptureTreeNode>) {
        self.childs.push(child)
    }
}

// === OnigRegion (match result) ===
/// Match result: parallel `beg` / `end` position vectors plus an optional
/// capture-history tree.
pub struct OnigRegion {
    /// Slot count bookkeeping; `resize` sets it to the new vector length.
    pub allocated: i32,
    /// Number of active slots; `resize` sets it to the new vector length.
    pub num_regs: i32,
    /// Begin position per slot; `ONIG_REGION_NOTPOS` when unset.
    pub beg: Vec<i32>,
    /// End position per slot; `ONIG_REGION_NOTPOS` when unset.
    pub end: Vec<i32>,
    /// Root of the capture-history tree, if any.
    pub history_root: Option<Box<OnigCaptureTreeNode>>,
}

impl OnigRegion {
    pub fn new() -> Self {
        OnigRegion {
            allocated: 0,
            num_regs: 0,
            beg: Vec::new(),
            end: Vec::new(),
            history_root: None,
        }
    }

    #[cfg_attr(coverage_nightly, coverage(off))]
    pub fn init(&mut self) {
        self.allocated = 0;
        self.num_regs = 0;
        self.beg.clear();
        self.end.clear();
        self.history_root = None;
    }

    pub fn clear(&mut self) {
        for i in 0..self.num_regs as usize {
            self.beg[i] = ONIG_REGION_NOTPOS;
            self.end[i] = ONIG_REGION_NOTPOS;
        }
        self.history_root = None;
    }

    pub fn resize(&mut self, n: i32) {
        let n = n as usize;
        self.beg.resize(n, ONIG_REGION_NOTPOS);
        self.end.resize(n, ONIG_REGION_NOTPOS);
        self.allocated = n as i32;
        self.num_regs = n as i32;
    }

    #[cfg_attr(coverage_nightly, coverage(off))]
    pub fn set(&mut self, at: i32, beg: i32, end: i32) -> i32 {
        if at < 0 {
            return ONIGERR_INVALID_ARGUMENT;
        }
        if at >= self.allocated {
            self.resize(at + 1);
        }
        self.beg[at as usize] = beg;
        self.end[at as usize] = end;
        ONIG_NORMAL
    }

    #[cfg_attr(coverage_nightly, coverage(off))]
    pub fn copy_from(&mut self, from: &OnigRegion) {
        self.resize(from.num_regs);
        for i in 0..from.num_regs as usize {
            self.beg[i] = from.beg[i];
            self.end[i] = from.end[i];
        }
        self.num_regs = from.num_regs;
        self.history_root = from.history_root.clone();
    }
}

impl Default for OnigRegion {
    #[cfg_attr(coverage_nightly, coverage(off))]
    fn default() -> Self {
        Self::new()
    }
}

// === Capture Traverse Constants ===
// Bit values that can be OR-ed together; `AT_BOTH` is `AT_FIRST | AT_LAST` (3).
pub const ONIG_TRAVERSE_CALLBACK_AT_FIRST: i32 = 1;
pub const ONIG_TRAVERSE_CALLBACK_AT_LAST: i32 = 2;
pub const ONIG_TRAVERSE_CALLBACK_AT_BOTH: i32 =
    ONIG_TRAVERSE_CALLBACK_AT_FIRST | ONIG_TRAVERSE_CALLBACK_AT_LAST;

/// Sentinel stored in region / capture-node positions that are not set.
pub const ONIG_REGION_NOTPOS: i32 = -1;

// === Error Info ===
/// Extra information attached to an error, held as raw bytes.
pub struct OnigErrorInfo {
    /// NOTE(review): presumably the pattern fragment an error message refers to — confirm.
    pub par: Vec<u8>,
}

// === Repeat Range ===
/// Pair of repeat bounds.
/// NOTE(review): whether `upper` is inclusive, or how "unbounded" is
/// encoded, is not visible here — confirm.
#[derive(Clone, Debug)]
pub struct OnigRepeatRange {
    pub lower: i32,
    pub upper: i32,
}

// === Char Table Size ===
/// 256: one entry per possible `u8` value.
pub const ONIG_CHAR_TABLE_SIZE: usize = 256;

// === RegSet Lead ===
/// Lead mode selector for regex sets, with fixed `i32` discriminants 0-2.
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
#[repr(i32)]
pub enum OnigRegSetLead {
    PositionLead = 0,
    RegexLead = 1,
    PriorityToRegexOrder = 2,
}

// === Compile Info ===
/// Bundle of compile-time settings.
pub struct OnigCompileInfo {
    /// NOTE(review): presumably the number of fields in use, as in the C struct — confirm.
    pub num_of_elements: i32,
    /// Raw pointer to the syntax definition.
    /// NOTE(review): nothing in this file establishes its validity or
    /// lifetime; callers must check before dereferencing.
    pub syntax: *const OnigSyntaxType,
    /// Option flags.
    pub option: OnigOptionType,
    /// Case-fold flags (`ONIGENC_CASE_FOLD_*`).
    pub case_fold_flag: OnigCaseFoldType,
}

// === Callout Types ===
/// Callout direction, with bit-like `i32` discriminants (1 and 2) so the
/// two can be combined into `ONIG_CALLOUT_IN_BOTH`.
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
#[repr(i32)]
pub enum OnigCalloutIn {
    Progress = 1,
    Retraction = 2,
}

/// `Progress | Retraction`, i.e. 3.
pub const ONIG_CALLOUT_IN_BOTH: i32 =
    OnigCalloutIn::Progress as i32 | OnigCalloutIn::Retraction as i32;

/// Callout kind selector (`Contents` = 0, `Name` = 1).
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
#[repr(i32)]
pub enum OnigCalloutOf {
    Contents = 0,
    Name = 1,
}

/// Callout type selector, with fixed `i32` discriminants 0-3.
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
#[repr(i32)]
pub enum OnigCalloutType {
    Single = 0,
    StartCall = 1,
    BothCall = 2,
    StartMarkEndCall = 3,
}

// Callout-related sentinels and sizes. Their use is not visible in this
// file; the notes below go by the names only.
/// NOTE(review): presumably the "no name id" sentinel — confirm.
pub const ONIG_NON_NAME_ID: i32 = -1;
/// NOTE(review): presumably the "no callout number" sentinel — confirm.
pub const ONIG_NON_CALLOUT_NUM: i32 = 0;
pub const ONIG_CALLOUT_MAX_ARGS_NUM: usize = 4;
pub const ONIG_CALLOUT_DATA_SLOT_NUM: usize = 5;

/// Callout outcome. Note the numbering: `Success` is 0 and `Fail` is 1.
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
#[repr(i32)]
pub enum OnigCalloutResult {
    Fail = 1,
    Success = 0,
}

/// Value type tag. `Void` is 0; every other variant is a distinct single
/// bit of a `u32` (bits 0-4).
#[derive(Clone, Copy, Debug, PartialEq, Eq)]
#[repr(u32)]
pub enum OnigType {
    Void = 0,
    Long = 1 << 0,
    Char = 1 << 1,
    String = 1 << 2,
    Pointer = 1 << 3,
    Tag = 1 << 4,
}

// === OnigValue (C union -> Rust enum) ===
/// Tagged value replacing the C union.
/// NOTE(review): `OnigType` declares a `Pointer` tag, but this enum has no
/// matching variant — confirm that is intentional.
#[derive(Clone, Debug)]
pub enum OnigValue {
    /// 64-bit signed integer.
    Long(i64),
    /// Single code point.
    Char(OnigCodePoint),
    /// Owned byte string (the field is named `start`, but it holds the
    /// whole byte vector).
    String { start: Vec<u8> },
    /// Integer tag.
    Tag(i32),
    /// No value.
    Void,
}

// === Pair Case Fold Codes (from regenc.h) ===
/// One `from` -> `to` code point pair of a case-fold mapping.
#[derive(Clone, Copy, Debug)]
pub struct OnigPairCaseFoldCodes {
    pub from: OnigCodePoint,
    pub to: OnigCodePoint,
}

// === Code Range ===
/// Code point range described by its two end points.
/// NOTE(review): whether `to` is inclusive is not visible here — confirm.
#[derive(Clone, Debug)]
pub struct OnigCodeRange {
    pub from: OnigCodePoint,
    pub to: OnigCodePoint,
}

// === Syntax check macros as functions ===
/// Returns `true` when at least one bit of `opm` is set in `syntax.op`.
/// A zero mask always yields `false`.
#[inline]
#[cfg_attr(coverage_nightly, coverage(off))]
pub fn is_syntax_op(syntax: &OnigSyntaxType, opm: u32) -> bool {
    let enabled = syntax.op & opm;
    enabled != 0
}

/// Returns `true` when at least one bit of `opm` is set in `syntax.op2`.
/// A zero mask always yields `false`.
#[inline]
#[cfg_attr(coverage_nightly, coverage(off))]
pub fn is_syntax_op2(syntax: &OnigSyntaxType, opm: u32) -> bool {
    let enabled = syntax.op2 & opm;
    enabled != 0
}

/// Returns `true` when at least one bit of `bvm` is set in `syntax.behavior`.
/// A zero mask always yields `false`.
#[inline]
pub fn is_syntax_bv(syntax: &OnigSyntaxType, bvm: u32) -> bool {
    let enabled = syntax.behavior & bvm;
    enabled != 0
}