summaryrefslogtreecommitdiff
path: root/test
diff options
context:
space:
mode:
authorJörg Frings-Fürst <debian@jff.email>2020-04-21 06:47:36 +0200
committerJörg Frings-Fürst <debian@jff.email>2020-04-21 06:47:36 +0200
commita792c4308d32f68f34131ff89e124190e4513c38 (patch)
tree68d5ba9857cafd597ea84011077a83e43f2d1620 /test
parent9e629c8f43b43617fa5b7d3654f7d81e81b8a427 (diff)
parentd1ffcb88ee95aded1bc4aef56f4f39951ad03ceb (diff)
Merge branch 'release/debian/6.9.5-1'debian/6.9.5-1
Diffstat (limited to 'test')
-rw-r--r--test/Makefile.am26
-rw-r--r--test/test_back.c1443
-rw-r--r--test/test_regset.c46
-rw-r--r--test/test_syntax.c246
-rw-r--r--test/test_utf8.c184
-rw-r--r--test/testc.c76
-rw-r--r--test/testp.c614
7 files changed, 2525 insertions, 110 deletions
diff --git a/test/Makefile.am b/test/Makefile.am
index 4d62568..f12eebe 100644
--- a/test/Makefile.am
+++ b/test/Makefile.am
@@ -6,9 +6,9 @@ AM_CFLAGS = -Wall -Wno-invalid-source-encoding
AM_CPPFLAGS = -I$(top_srcdir)/src
if ENABLE_POSIX_API
-TESTS = test_utf8 testc testp testcu test_regset
+TESTS = test_utf8 test_syntax testc testp testcu test_regset test_back
else
-TESTS = test_utf8 testc testcu test_regset
+TESTS = test_utf8 test_syntax testc testcu test_regset test_back
endif
check_PROGRAMS = $(TESTS)
@@ -16,10 +16,12 @@ check_PROGRAMS = $(TESTS)
test: test_uchar $(TESTS)
@echo "[Oniguruma API, UTF-8 check]"
@./test_utf8 | grep RESULT
- @echo "[Oniguruma API, ASCII/EUC-JP check]"
+ @echo "[Oniguruma API, SYNTAX check]"
+ @./test_syntax | grep RESULT
+ @echo "[Oniguruma API, EUC-JP check]"
@./testc | grep RESULT
if ENABLE_POSIX_API
- @echo "[POSIX API, ASCII/EUC-JP check]"
+ @echo "[POSIX API, UTF-8 check]"
@./testp | grep RESULT
endif
@echo "[Oniguruma API, UTF-16 check]"
@@ -27,6 +29,8 @@ endif
@echo ""
@echo "[Oniguruma API, regset check]"
@./test_regset
+ @echo "[Oniguruma API, backward search check]"
+ @./test_back | grep RESULT
test_uchar:
@echo "[UChar in oniguruma.h check]"
@@ -36,13 +40,14 @@ test_uchar:
test_utf8_SOURCES = test_utf8.c
test_utf8_LDADD = $(lib_onig)
+test_syntax_SOURCES = test_syntax.c
+test_syntax_LDADD = $(lib_onig)
+
testc_SOURCES = testc.c
testc_LDADD = $(lib_onig)
-testp_SOURCES = testc.c
+testp_SOURCES = testp.c
testp_LDADD = $(lib_onig)
-testp_CFLAGS = -DPOSIX_TEST -Wall -Wno-invalid-source-encoding
-
testcu_SOURCES = testu.c
testcu_LDADD = $(lib_onig)
@@ -50,10 +55,17 @@ testcu_LDADD = $(lib_onig)
test_regset_SOURCES = test_regset.c
test_regset_LDADD = $(lib_onig)
+test_back_SOURCES = test_back.c
+test_back_LDADD = $(lib_onig)
+
gcov:
make CFLAGS="--coverage" test_utf8
+ make CFLAGS="--coverage" test_syntax
make CFLAGS="--coverage" testc
+if ENABLE_POSIX_API
make CFLAGS="--coverage" testp
+endif
make CFLAGS="--coverage" testcu
make CFLAGS="--coverage" test_regset
+ make CFLAGS="--coverage" test_back
diff --git a/test/test_back.c b/test/test_back.c
new file mode 100644
index 0000000..9a337b9
--- /dev/null
+++ b/test/test_back.c
@@ -0,0 +1,1443 @@
+/*
+ * test_back.c
+ * Copyright (c) 2020 K.Kosako
+ */
+#include "config.h"
+#ifdef ONIG_ESCAPE_UCHAR_COLLISION
+#undef ONIG_ESCAPE_UCHAR_COLLISION
+#endif
+#include <stdio.h>
+
+#include "oniguruma.h"
+
+#include <string.h>
+
+#define SLEN(s) strlen(s)
+
+static int nsucc = 0;
+static int nfail = 0;
+static int nerror = 0;
+
+static FILE* err_file;
+
+static OnigRegion* region;
+
+static void xx(char* pattern, char* str, int from, int to, int mem, int not,
+ int error_no, int line_no)
+{
+ int r;
+ regex_t* reg;
+ OnigErrorInfo einfo;
+
+ r = onig_new(&reg, (UChar* )pattern, (UChar* )(pattern + SLEN(pattern)),
+ ONIG_OPTION_DEFAULT, ONIG_ENCODING_UTF8, ONIG_SYNTAX_DEFAULT, &einfo);
+ if (r) {
+ char s[ONIG_MAX_ERROR_MESSAGE_LEN];
+
+ if (error_no == 0) {
+ onig_error_code_to_str((UChar* )s, r, &einfo);
+ fprintf(err_file, "ERROR: %s /%s/ #%d\n", s, pattern, line_no);
+ nerror++;
+ }
+ else {
+ if (r == error_no) {
+ fprintf(stdout, "OK(ERROR): /%s/ %d #%d\n", pattern, r, line_no);
+ nsucc++;
+ }
+ else {
+ fprintf(stdout, "FAIL(ERROR): /%s/ '%s', %d, %d #%d\n", pattern, str,
+ error_no, r, line_no);
+ nfail++;
+ }
+ }
+
+ return ;
+ }
+
+ r = onig_search(reg, (UChar* )str, (UChar* )(str + SLEN(str)),
+ (UChar* )(str + SLEN(str)), (UChar* )str,
+ region, ONIG_OPTION_NONE);
+ if (r < ONIG_MISMATCH) {
+ char s[ONIG_MAX_ERROR_MESSAGE_LEN];
+
+ if (error_no == 0) {
+ onig_error_code_to_str((UChar* )s, r);
+ fprintf(err_file, "ERROR: %s /%s/ #%d\n", s, pattern, line_no);
+ nerror++;
+ }
+ else {
+ if (r == error_no) {
+ fprintf(stdout, "OK(ERROR): /%s/ '%s', %d #%d\n", pattern, str, r, line_no);
+ nsucc++;
+ }
+ else {
+ fprintf(stdout, "FAIL ERROR NO: /%s/ '%s', %d, %d #%d\n", pattern,
+ str, error_no, r, line_no);
+ nfail++;
+ }
+ }
+
+ return ;
+ }
+
+ if (r == ONIG_MISMATCH) {
+ if (not) {
+ fprintf(stdout, "OK(N): /%s/ '%s' #%d\n", pattern, str, line_no);
+ nsucc++;
+ }
+ else {
+ fprintf(stdout, "FAIL: /%s/ '%s' #%d\n", pattern, str, line_no);
+ nfail++;
+ }
+ }
+ else {
+ if (not) {
+ fprintf(stdout, "FAIL(N): /%s/ '%s' #%d\n", pattern, str, line_no);
+ nfail++;
+ }
+ else {
+ if (region->beg[mem] == from && region->end[mem] == to) {
+ fprintf(stdout, "OK: /%s/ '%s' #%d\n", pattern, str, line_no);
+ nsucc++;
+ }
+ else {
+ fprintf(stdout, "FAIL: /%s/ '%s' %d-%d : %d-%d #%d\n", pattern, str,
+ from, to, region->beg[mem], region->end[mem], line_no);
+ nfail++;
+ }
+ }
+ }
+ onig_free(reg);
+}
+
+static void xx2(char* pattern, char* str, int from, int to, int line_no)
+{
+ xx(pattern, str, from, to, 0, 0, 0, line_no);
+}
+
+static void xx3(char* pattern, char* str, int from, int to, int mem, int line_no)
+{
+ xx(pattern, str, from, to, mem, 0, 0, line_no);
+}
+
+static void xn(char* pattern, char* str, int line_no)
+{
+ xx(pattern, str, 0, 0, 0, 1, 0, line_no);
+}
+
+static void xe(char* pattern, char* str, int error_no, int line_no)
+{
+ xx(pattern, str, 0, 0, 0, 0, error_no, line_no);
+}
+
+#define x2(p,s,f,t) xx2(p,s,f,t, __LINE__)
+#define x3(p,s,f,t,m) xx3(p,s,f,t,m, __LINE__)
+#define n(p,s) xn(p,s, __LINE__)
+#define e(p,s,e) xe(p,s,e, __LINE__)
+
+extern int main(int argc, char* argv[])
+{
+ OnigEncoding use_encs[1];
+
+ use_encs[0] = ONIG_ENCODING_UTF8;
+ onig_initialize(use_encs, sizeof(use_encs)/sizeof(use_encs[0]));
+
+ err_file = stdout;
+
+ region = onig_region_new();
+
+ x2("", "", 0, 0);
+ x2("^", "", 0, 0);
+ x2("^a", "\na", 1, 2);
+ x2("$", "", 0, 0);
+ x2("$\\O", "bb\n", 2, 3);
+ x2("\\G", "", 0, 0);
+ x2("\\A", "", 0, 0);
+ x2("\\Z", "", 0, 0);
+ x2("\\z", "", 0, 0);
+ x2("^$", "", 0, 0);
+ x2("\\ca", "\001", 0, 1);
+ x2("\\C-b", "\002", 0, 1);
+ x2("\\c\\\\", "\034", 0, 1);
+ x2("q[\\c\\\\]", "q\034", 0, 2);
+ x2("", "a", 1, 1);
+ x2("a", "a", 0, 1);
+ x2("\\x61", "a", 0, 1);
+ x2("aa", "aa", 0, 2);
+ x2("aaa", "aaa", 0, 3);
+ x2("aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa", "aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa", 0, 35);
+ x2("ab", "ab", 0, 2);
+ x2("b", "ab", 1, 2);
+ x2("bc", "abc", 1, 3);
+ x2("(?i:#RET#)", "#INS##RET#", 5, 10);
+ x2("\\17", "\017", 0, 1);
+ x2("\\x1f", "\x1f", 0, 1);
+ x2("a(?#....\\\\JJJJ)b", "ab", 0, 2);
+ x2("(?x) G (o O(?-x)oO) g L", "GoOoOgLe", 0, 7);
+ x2(".", "a", 0, 1);
+ n(".", "");
+ x2("..", "ab", 0, 2);
+ x2("\\w", "e", 0, 1);
+ n("\\W", "e");
+ x2("\\s", " ", 0, 1);
+ x2("\\S", "b", 0, 1);
+ x2("\\d", "4", 0, 1);
+ n("\\D", "4");
+ x2("\\b", "z ", 1, 1);
+ x2("\\b", " z", 2, 2);
+ x2("\\b", " z ", 3, 3);
+ x2("\\B", "zz ", 3, 3);
+ x2("\\B", "z ", 2, 2);
+ x2("\\B", " z", 0, 0);
+ x2("[ab]", "b", 0, 1);
+ n("[ab]", "c");
+ x2("[a-z]", "t", 0, 1);
+ n("[^a]", "a");
+ x2("[^a]", "\n", 0, 1);
+ x2("[]]", "]", 0, 1);
+ n("[^]]", "]");
+ x2("[\\^]+", "0^^1", 2, 3);
+ x2("[b-]", "b", 0, 1);
+ x2("[b-]", "-", 0, 1);
+ x2("[\\w]", "z", 0, 1);
+ n("[\\w]", " ");
+ x2("[\\W]", "b$", 1, 2);
+ x2("[\\d]", "5", 0, 1);
+ n("[\\d]", "e");
+ x2("[\\D]", "t", 0, 1);
+ n("[\\D]", "3");
+ x2("[\\s]", " ", 0, 1);
+ n("[\\s]", "a");
+ x2("[\\S]", "b", 0, 1);
+ n("[\\S]", " ");
+ x2("[\\w\\d]", "2", 0, 1);
+ n("[\\w\\d]", " ");
+ x2("[[:upper:]]", "B", 0, 1);
+ x2("[*[:xdigit:]+]", "+", 0, 1);
+ x2("[*[:xdigit:]+]", "GHIKK-9+*", 8, 9);
+ x2("[*[:xdigit:]+]", "-@^+", 3, 4);
+ n("[[:upper]]", "A");
+ x2("[[:upper]]", ":", 0, 1);
+ x2("[\\044-\\047]", "\046", 0, 1);
+ x2("[\\x5a-\\x5c]", "\x5b", 0, 1);
+ x2("[\\x6A-\\x6D]", "\x6c", 0, 1);
+ n("[\\x6A-\\x6D]", "\x6E");
+ n("^[0-9A-F]+ 0+ UNDEF ", "75F 00000000 SECT14A notype () External | _rb_apply");
+ x2("[\\[]", "[", 0, 1);
+ x2("[\\]]", "]", 0, 1);
+ x2("[&]", "&", 0, 1);
+ x2("[[ab]]", "b", 0, 1);
+ x2("[[ab]c]", "c", 0, 1);
+ n("[[^a]]", "a");
+ n("[^[a]]", "a");
+ x2("[[ab]&&bc]", "b", 0, 1);
+ n("[[ab]&&bc]", "a");
+ n("[[ab]&&bc]", "c");
+ x2("[a-z&&b-y&&c-x]", "w", 0, 1);
+ n("[^a-z&&b-y&&c-x]", "w");
+ x2("[[^a&&a]&&a-z]", "b", 0, 1);
+ n("[[^a&&a]&&a-z]", "a");
+ x2("[[^a-z&&bcdef]&&[^c-g]]", "h", 0, 1);
+ n("[[^a-z&&bcdef]&&[^c-g]]", "c");
+ x2("[^[^abc]&&[^cde]]", "c", 0, 1);
+ x2("[^[^abc]&&[^cde]]", "e", 0, 1);
+ n("[^[^abc]&&[^cde]]", "f");
+ x2("[a-&&-a]", "-", 0, 1);
+ n("[a\\-&&\\-a]", "&");
+ n("\\wabc", " abc");
+ x2("a\\Wbc", "a bc", 0, 4);
+ x2("a.b.c", "aabbc", 0, 5);
+ x2(".\\wb\\W..c", "abb bcc", 0, 7);
+ x2("\\s\\wzzz", " zzzz", 0, 5);
+ x2("aa.b", "aabb", 0, 4);
+ n(".a", "ab");
+ x2(".a", "aa", 0, 2);
+ x2("^a", "a", 0, 1);
+ x2("^a$", "a", 0, 1);
+ x2("^\\w$", "a", 0, 1);
+ n("^\\w$", " ");
+ x2("^\\wab$", "zab", 0, 3);
+ x2("^\\wabcdef$", "zabcdef", 0, 7);
+ x2("^\\w...def$", "zabcdef", 0, 7);
+ x2("\\w\\w\\s\\Waaa\\d", "aa aaa4", 0, 8);
+ x2("\\A\\Z", "", 0, 0);
+ x2("\\Axyz", "xyz", 0, 3);
+ x2("xyz\\Z", "xyz", 0, 3);
+ x2("xyz\\z", "xyz", 0, 3);
+ x2("a\\Z", "a", 0, 1);
+ n("\\Gaz", "az");
+ n("\\Gz", "bza");
+ x2("az\\G", "az", 0, 2);
+ n("az\\A", "az");
+ n("a\\Az", "az");
+ x2("\\^\\$", "^$", 0, 2);
+ x2("^x?y", "xy", 0, 2);
+ x2("^(x?y)", "xy", 0, 2);
+ x2("\\w", "_", 0, 1);
+ n("\\W", "_");
+ x2("(?=z)z", "z", 0, 1);
+ n("(?=z).", "a");
+ x2("(?!z)a", "a", 0, 1);
+ n("(?!z)a", "z");
+ x2("(?i:a)", "a", 0, 1);
+ x2("(?i:a)", "A", 0, 1);
+ x2("(?i:A)", "a", 0, 1);
+ x2("(?i:i)", "I", 0, 1);
+ x2("(?i:I)", "i", 0, 1);
+ x2("(?i:[A-Z])", "i", 0, 1);
+ x2("(?i:[a-z])", "I", 0, 1);
+ n("(?i:A)", "b");
+ x2("(?i:ss)", "ss", 0, 2);
+ x2("(?i:ss)", "Ss", 0, 2);
+ x2("(?i:ss)", "SS", 0, 2);
+ /* 0xc5,0xbf == 017F: # LATIN SMALL LETTER LONG S */
+ x2("(?i:ss)", "\xc5\xbfS", 0, 3);
+ x2("(?i:ss)", "s\xc5\xbf", 0, 3);
+ /* 0xc3,0x9f == 00DF: # LATIN SMALL LETTER SHARP S */
+ x2("(?i:ss)", "\xc3\x9f", 0, 2);
+ /* 0xe1,0xba,0x9e == 1E9E # LATIN CAPITAL LETTER SHARP S */
+ x2("(?i:ss)", "\xe1\xba\x9e", 0, 3);
+ x2("(?i:xssy)", "xssy", 0, 4);
+ x2("(?i:xssy)", "xSsy", 0, 4);
+ x2("(?i:xssy)", "xSSy", 0, 4);
+ x2("(?i:xssy)", "x\xc5\xbfSy", 0, 5);
+ x2("(?i:xssy)", "xs\xc5\xbfy", 0, 5);
+ x2("(?i:xssy)", "x\xc3\x9fy", 0, 4);
+ x2("(?i:xssy)", "x\xe1\xba\x9ey", 0, 5);
+ x2("(?i:x\xc3\x9fy)", "xssy", 0, 4);
+ x2("(?i:x\xc3\x9fy)", "xSSy", 0, 4);
+ x2("(?i:\xc3\x9f)", "ss", 0, 2);
+ x2("(?i:\xc3\x9f)", "SS", 0, 2);
+ x2("(?i:[\xc3\x9f])", "ss", 0, 2);
+ x2("(?i:[\xc3\x9f])", "SS", 0, 2);
+ x2("(?i)(?<!ss)z", "qqz", 2, 3);
+ x2("(?i:[A-Z])", "a", 0, 1);
+ x2("(?i:[f-m])", "H", 0, 1);
+ x2("(?i:[f-m])", "h", 0, 1);
+ n("(?i:[f-m])", "e");
+ x2("(?i:[A-c])", "D", 0, 1);
+ n("(?i:[^a-z])", "A");
+ n("(?i:[^a-z])", "a");
+ x2("(?i:[!-k])", "Z", 0, 1);
+ x2("(?i:[!-k])", "7", 0, 1);
+ x2("(?i:[T-}])", "b", 0, 1);
+ x2("(?i:[T-}])", "{", 0, 1);
+ x2("(?i:\\?a)", "?A", 0, 2);
+ x2("(?i:\\*A)", "*a", 0, 2);
+ n(".", "\n");
+ x2("(?m:.)", "\n", 0, 1);
+ x2("(?m:a.)", "a\n", 0, 2);
+ x2("(?m:.b)", "a\nb", 1, 3);
+ x2(".*abc", "dddabdd\nddabc", 10, 13);
+ x2(".+abc", "dddabdd\nddabcaa\naaaabc", 18, 22);
+ x2("(?m:.*abc)", "dddabddabc", 7, 10);
+ n("(?i)(?-i)a", "A");
+ n("(?i)(?-i:a)", "A");
+ x2("a?", "", 0, 0);
+ x2("a?", "b", 1, 1);
+ x2("a?", "a", 1, 1);
+ x2("a*", "", 0, 0);
+ x2("a*", "a", 1, 1);
+ x2("a*", "aaa", 3, 3);
+ x2("a*", "baaaa", 5, 5);
+ n("a+", "");
+ x2("a+", "a", 0, 1);
+ x2("a+", "aaaa", 3, 4);
+ x2("a+", "aabbb", 1, 2);
+ x2("a+", "baaaa", 4, 5);
+ x2(".?", "", 0, 0);
+ x2(".?", "f", 1, 1);
+ x2(".?", "\n", 1, 1);
+ x2(".*", "", 0, 0);
+ x2(".*", "abcde", 5, 5);
+ x2(".+", "z", 0, 1);
+ x2(".+", "zdswer\n", 5, 6);
+ x2("(.*)a\\1f", "babfbac", 0, 4);
+ x2("(.*)a\\1f", "bacbabf", 3, 7);
+ x2("((.*)a\\2f)", "bacbabf", 3, 7);
+ x2("(.*)a\\1f", "baczzzzzz\nbazz\nzzzzbabf", 19, 23);
+ x2("a|b", "a", 0, 1);
+ x2("a|b", "b", 0, 1);
+ x2("|a", "a", 1, 1);
+ x2("(|a)", "a", 1, 1);
+ x2("ab|bc", "ab", 0, 2);
+ x2("ab|bc", "bc", 0, 2);
+ x2("z(?:ab|bc)", "zbc", 0, 3);
+ x2("a(?:ab|bc)c", "aabc", 0, 4);
+ x2("ab|(?:ac|az)", "az", 0, 2);
+ x2("a|b|c", "dc", 1, 2);
+ x2("a|b|cd|efg|h|ijk|lmn|o|pq|rstuvwx|yz", "pqr", 0, 2);
+ n("a|b|cd|efg|h|ijk|lmn|o|pq|rstuvwx|yz", "mn");
+ x2("a|^z", "ba", 1, 2);
+ x2("a|^z", "za", 1, 2);
+ x2("a|\\Gz", "bza", 2, 3);
+ x2("a|\\Gz", "za", 1, 2);
+ x2("a|\\Az", "bza", 2, 3);
+ x2("a|\\Az", "za", 1, 2);
+ x2("a|b\\Z", "ba", 1, 2);
+ x2("a|b\\Z", "b", 0, 1);
+ x2("a|b\\z", "ba", 1, 2);
+ x2("a|b\\z", "b", 0, 1);
+ x2("\\w|\\s", " ", 0, 1);
+ n("\\w|\\w", " ");
+ x2("\\w|%", "%", 0, 1);
+ x2("\\w|[&$]", "&", 0, 1);
+ x2("[b-d]|[^e-z]", "a", 0, 1);
+ x2("(?:a|[c-f])|bz", "dz", 0, 1);
+ x2("(?:a|[c-f])|bz", "bz", 0, 2);
+ x2("abc|(?=zz)..f", "zzf", 0, 3);
+ x2("abc|(?!zz)..f", "abf", 0, 3);
+ x2("(?=za)..a|(?=zz)..a", "zza", 0, 3);
+ n("(?>a|abd)c", "abdc");
+ x2("(?>abd|a)c", "abdc", 0, 4);
+ x2("a?|b", "a", 1, 1);
+ x2("a?|b", "b", 1, 1);
+ x2("a?|b", "", 0, 0);
+ x2("a*|b", "aa", 2, 2);
+ x2("a*|b*", "ba", 2, 2);
+ x2("a*|b*", "ab", 2, 2);
+ x2("a+|b*", "", 0, 0);
+ x2("a+|b*", "bbb", 3, 3);
+ x2("a+|b*", "abbb", 4, 4);
+ n("a+|b+", "");
+ x2("(a|b)?", "b", 1, 1);
+ x2("(a|b)*", "ba", 2, 2);
+ x2("(a|b)+", "bab", 2, 3);
+ x2("(ab|ca)+", "caabbc", 2, 4);
+ x2("(ab|ca)+", "aabca", 3, 5);
+ x2("(ab|ca)+", "abzca", 3, 5);
+ x2("(a|bab)+", "ababa", 4, 5);
+ x2("(a|bab)+", "ba", 1, 2);
+ x2("(a|bab)+", "baaaba", 5, 6);
+ x2("(?:a|b)(?:a|b)", "ab", 0, 2);
+ x2("(?:a*|b*)(?:a*|b*)", "aaabbb", 6, 6);
+ x2("(?:a*|b*)(?:a+|b+)", "aaabbb", 5, 6);
+ x2("(?:a+|b+){2}", "aaabbb", 4, 6);
+ x2("h{0,}", "hhhh", 4, 4);
+ x2("(?:a+|b+){1,2}", "aaabbb", 5, 6);
+ n("ax{2}*a", "0axxxa1");
+ n("a.{0,2}a", "0aXXXa0");
+ n("a.{0,2}?a", "0aXXXa0");
+ n("a.{0,2}?a", "0aXXXXa0");
+ x2("^a{2,}?a$", "aaa", 0, 3);
+ x2("^[a-z]{2,}?$", "aaa", 0, 3);
+ x2("(?:a+|\\Ab*)cc", "cc", 0, 2);
+ n("(?:a+|\\Ab*)cc", "abcc");
+ x2("(?:^a+|b+)*c", "aabbbabc", 7, 8);
+ x2("(?:^a+|b+)*c", "aabbbbc", 6, 7);
+ x2("a|(?i)c", "C", 0, 1);
+ x2("(?i)c|a", "C", 0, 1);
+ x2("(?i)c|a", "A", 0, 1);
+ x2("a(?i)b|c", "aB", 0, 2);
+ x2("a(?i)b|c", "aC", 0, 2);
+ n("a(?i)b|c", "AC");
+ n("a(?:(?i)b)|c", "aC");
+ x2("(?i:c)|a", "C", 0, 1);
+ n("(?i:c)|a", "A");
+ x2("[abc]?", "abc", 3, 3);
+ x2("[abc]*", "abc", 3, 3);
+ x2("[^abc]*", "abc", 3, 3);
+ n("[^abc]+", "abc");
+ x2("a?\?", "aaa", 3, 3);
+ x2("ba?\?b", "bab", 0, 3);
+ x2("a*?", "aaa", 3, 3);
+ x2("ba*?", "baa", 0, 1);
+ x2("ba*?b", "baab", 0, 4);
+ x2("a+?", "aaa", 2, 3);
+ x2("ba+?", "baa", 0, 2);
+ x2("ba+?b", "baab", 0, 4);
+ x2("(?:a?)?\?", "a", 1, 1);
+ x2("(?:a?\?)?", "a", 1, 1);
+ x2("(?:a?)+?", "aaa", 3, 3);
+ x2("(?:a+)?\?", "aaa", 3, 3);
+ x2("(?:a+)?\?b", "aaab", 3, 4);
+ x2("(?:ab)?{2}", "", 0, 0);
+ x2("(?:ab)?{2}", "ababa", 5, 5);
+ x2("(?:ab)*{0}", "ababa", 5, 5);
+ x2("(?:ab){3,}", "abababab", 2, 8);
+ n("(?:ab){3,}", "abab");
+ x2("(?:ab){2,4}", "ababab", 2, 6);
+ x2("(?:ab){2,4}", "ababababab", 6, 10);
+ x2("(?:ab){2,4}?", "ababababab", 6, 10);
+ x2("(?:ab){,}", "ab{,}", 0, 5);
+ x2("(?:abc)+?{2}", "abcabcabc", 3, 9);
+ x2("(?:X*)(?i:xa)", "XXXa", 2, 4);
+ x2("(d+)([^abc]z)", "dddz", 1, 4);
+ x2("([^abc]*)([^abc]z)", "dddz", 2, 4);
+ x2("(\\w+)(\\wz)", "dddz", 1, 4);
+ x3("(a)", "a", 0, 1, 1);
+ x3("(ab)", "ab", 0, 2, 1);
+ x2("((ab))", "ab", 0, 2);
+ x3("((ab))", "ab", 0, 2, 1);
+ x3("((ab))", "ab", 0, 2, 2);
+ x3("((((((((((((((((((((ab))))))))))))))))))))", "ab", 0, 2, 20);
+ x3("(ab)(cd)", "abcd", 0, 2, 1);
+ x3("(ab)(cd)", "abcd", 2, 4, 2);
+ x3("()(a)bc(def)ghijk", "abcdefghijk", 3, 6, 3);
+ x3("(()(a)bc(def)ghijk)", "abcdefghijk", 3, 6, 4);
+ x2("(^a)", "a", 0, 1);
+ x3("(a)|(a)", "ba", 1, 2, 1);
+ x3("(^a)|(a)", "ba", 1, 2, 2);
+ x3("(a?)", "aaa", 3, 3, 1);
+ x3("(a*)", "aaa", 3, 3, 1);
+ x3("(a*)", "", 0, 0, 1);
+ x3("(a+)", "aaaaaaa", 6, 7, 1);
+ x3("(a+|b*)", "bbbaa", 5, 5, 1);
+ x3("(a+|b?)", "bbbaa", 5, 5, 1);
+ x3("(abc)?", "abc", -1, -1, 1);
+ x3("(abc)*", "abc", -1, -1, 1);
+ x3("(abc)+", "abc", 0, 3, 1);
+ x3("(xyz|abc)+", "abc", 0, 3, 1);
+ x3("([xyz][abc]|abc)+", "abc", 0, 3, 1);
+ x3("((?i:abc))", "AbC", 0, 3, 1);
+ x2("(abc)(?i:\\1)", "abcABC", 0, 6);
+ x3("((?m:a.c))", "a\nc", 0, 3, 1);
+ x3("((?=az)a)", "azb", 0, 1, 1);
+ x3("abc|(.abd)", "zabd", 0, 4, 1);
+ x2("(?:abc)|(ABC)", "abc", 0, 3);
+ x3("(?i:(abc))|(zzz)", "ABC", 0, 3, 1);
+ x3("a*(.)", "aaaaz", 4, 5, 1);
+ x3("a*?(.)", "aaaaz", 4, 5, 1);
+ x3("a*?(c)", "aaaac", 4, 5, 1);
+ x3("[bcd]a*(.)", "caaaaz", 5, 6, 1);
+ x3("(\\Abb)cc", "bbcc", 0, 2, 1);
+ n("(\\Abb)cc", "zbbcc");
+ x3("(^bb)cc", "bbcc", 0, 2, 1);
+ n("(^bb)cc", "zbbcc");
+ x3("cc(bb$)", "ccbb", 2, 4, 1);
+ n("cc(bb$)", "ccbbb");
+ n("(\\1)", "");
+ n("\\1(a)", "aa");
+ n("(a(b)\\1)\\2+", "ababb");
+ n("(?:(?:\\1|z)(a))+$", "zaa");
+ x2("(?:(?:\\1|z)(a))+$", "zaaa", 0, 4);
+ x2("(a)(?=\\1)", "aa", 0, 1);
+ n("(a)$|\\1", "az");
+ x2("(a)\\1", "aa", 0, 2);
+ n("(a)\\1", "ab");
+ x2("(a?)\\1", "aa", 2, 2);
+ x2("(a?\?)\\1", "aa", 2, 2);
+ x2("(a*)\\1", "aaaaa", 5, 5);
+ x3("(a*)\\1", "aaaaa", 5, 5, 1);
+ x2("a(b*)\\1", "abbbb", 0, 5);
+ x2("a(b*)\\1", "ab", 0, 1);
+ x2("(a*)(b*)\\1\\2", "aaabbaaabb", 10, 10);
+ x2("(a*)(b*)\\2", "aaabbbb", 7, 7);
+ x2("(((((((a*)b))))))c\\7", "aaabcaaa", 3, 5);
+ x3("(((((((a*)b))))))c\\7", "aaabcaaa", 3, 3, 7);
+ x2("(a)(b)(c)\\2\\1\\3", "abcbac", 0, 6);
+ x2("([a-d])\\1", "cc", 0, 2);
+ x2("(\\w\\d\\s)\\1", "f5 f5 ", 0, 6);
+ n("(\\w\\d\\s)\\1", "f5 f5");
+ x2("(who|[a-c]{3})\\1", "whowho", 0, 6);
+ x2("...(who|[a-c]{3})\\1", "abcwhowho", 0, 9);
+ x2("(who|[a-c]{3})\\1", "cbccbc", 0, 6);
+ x2("(^a)\\1", "aa", 0, 2);
+ n("(^a)\\1", "baa");
+ n("(a$)\\1", "aa");
+ n("(ab\\Z)\\1", "ab");
+ x2("(a*\\Z)\\1", "a", 1, 1);
+ x2(".(a*\\Z)\\1", "ba", 1, 2);
+ x3("(.(abc)\\2)", "zabcabc", 0, 7, 1);
+ x3("(.(..\\d.)\\2)", "z12341234", 0, 9, 1);
+ x2("((?i:az))\\1", "AzAz", 0, 4);
+ n("((?i:az))\\1", "Azaz");
+ x2("(?<=a)b", "ab", 1, 2);
+ n("(?<=a)b", "bb");
+ x2("(?<=a|b)b", "bb", 1, 2);
+ x2("(?<=a|bc)b", "bcb", 2, 3);
+ x2("(?<=a|bc)b", "ab", 1, 2);
+ x2("(?<=a|bc||defghij|klmnopq|r)z", "rz", 1, 2);
+ x3("(?<=(abc))d", "abcd", 0, 3, 1);
+ x2("(?<=(?i:abc))d", "ABCd", 3, 4);
+ x2("(a)\\g<1>", "aa", 0, 2);
+ x2("(?<!a)b", "cb", 1, 2);
+ n("(?<!a)b", "ab");
+ x2("(?<!a|bc)b", "bbb", 2, 3);
+ n("(?<!a|bc)z", "bcz");
+ x2("(?<name1>a)", "a", 0, 1);
+ x2("(?<name_2>ab)\\g<name_2>", "abab", 0, 4);
+ x2("(?<name_3>.zv.)\\k<name_3>", "azvbazvb", 0, 8);
+ x2("(?<=\\g<ab>)|-\\zEND (?<ab>XyZ)", "XyZ", 3, 3);
+ x2("(?<n>|a\\g<n>)+", "", 0, 0);
+ x2("(?<n>|\\(\\g<n>\\))+$", "()(())", 6, 6);
+ x3("\\g<n>(?<n>.){0}", "X", 0, 1, 1);
+ x2("\\g<n>(abc|df(?<n>.YZ){2,8}){0}", "XYZ", 0, 3);
+ x2("\\A(?<n>(a\\g<n>)|)\\z", "aaaa", 0, 4);
+ x2("(?<n>|\\g<m>\\g<n>)\\z|\\zEND (?<m>a|(b)\\g<m>)", "bbbbabba", 8, 8);
+ x2("(?<name1240>\\w+\\sx)a+\\k<name1240>", " fg xaaaaaaaafg x", 2, 18);
+ x3("(z)()()(?<_9>a)\\g<_9>", "zaa", 2, 3, 1);
+ x2("(.)(((?<_>a)))\\k<_>", "zaa", 0, 3);
+ x2("((?<name1>\\d)|(?<name2>\\w))(\\k<name1>|\\k<name2>)", "ff", 0, 2);
+ x2("(?:(?<x>)|(?<x>efg))\\k<x>", "", 0, 0);
+ x2("(?:(?<x>abc)|(?<x>efg))\\k<x>", "abcefgefg", 3, 9);
+ n("(?:(?<x>abc)|(?<x>efg))\\k<x>", "abcefg");
+ x2("(?:(?<n1>.)|(?<n1>..)|(?<n1>...)|(?<n1>....)|(?<n1>.....)|(?<n1>......)|(?<n1>.......)|(?<n1>........)|(?<n1>.........)|(?<n1>..........)|(?<n1>...........)|(?<n1>............)|(?<n1>.............)|(?<n1>..............))\\k<n1>$", "a-pyumpyum", 2, 10);
+ x3("(?:(?<n1>.)|(?<n1>..)|(?<n1>...)|(?<n1>....)|(?<n1>.....)|(?<n1>......)|(?<n1>.......)|(?<n1>........)|(?<n1>.........)|(?<n1>..........)|(?<n1>...........)|(?<n1>............)|(?<n1>.............)|(?<n1>..............))\\k<n1>$", "xxxxabcdefghijklmnabcdefghijklmn", 4, 18, 14);
+ x3("(?<name1>)(?<name2>)(?<name3>)(?<name4>)(?<name5>)(?<name6>)(?<name7>)(?<name8>)(?<name9>)(?<name10>)(?<name11>)(?<name12>)(?<name13>)(?<name14>)(?<name15>)(?<name16>aaa)(?<name17>)$", "aaa", 0, 3, 16);
+ x2("(?<foo>a|\\(\\g<foo>\\))", "a", 0, 1);
+ x2("(?<foo>a|\\(\\g<foo>\\))", "((((((a))))))", 6, 7);
+ x3("(?<foo>a|\\(\\g<foo>\\))", "((((((((a))))))))", 8, 9, 1);
+ x2("\\g<bar>|\\zEND(?<bar>.*abc$)", "abcxxxabc", 6, 9);
+ x2("\\g<1>|\\zEND(.a.)", "bac", 0, 3);
+ x3("\\g<_A>\\g<_A>|\\zEND(.a.)(?<_A>.b.)", "xbxyby", 3, 6, 1);
+ x2("\\A(?:\\g<pon>|\\g<pan>|\\zEND (?<pan>a|c\\g<pon>c)(?<pon>b|d\\g<pan>d))$", "cdcbcdc", 0, 7);
+ x2("\\A(?<n>|a\\g<m>)\\z|\\zEND (?<m>\\g<n>)", "aaaa", 0, 4);
+ x2("(?<n>(a|b\\g<n>c){3,5})", "baaaaca", 2, 5);
+ x2("(?<n>(a|b\\g<n>c){3,5})", "baaaacaaaaa", 8, 11);
+ x2("(?<pare>\\(([^\\(\\)]++|\\g<pare>)*+\\))", "((a))", 1, 4);
+ x2("()*\\1", "", 0, 0);
+ x2("(?:()|())*\\1\\2", "", 0, 0);
+ x2("(?:a*|b*)*c", "abadc", 4, 5);
+ x3("(?:\\1a|())*", "a", 1, 1, 1);
+ x2("x((.)*)*x", "0x1x2x3", 3, 6);
+ x2("x((.)*)*x(?i:\\1)\\Z", "0x1x2x1X2", 1, 9);
+ x2("(?:()|()|()|()|()|())*\\2\\5", "", 0, 0);
+ x2("(?:()|()|()|(x)|()|())*\\2b\\5", "b", 0, 1);
+ x2("[0-9-a]", "-", 0, 1); // PR#44
+ n("[0-9-a]", ":"); // PR#44
+ x3("(\\(((?:[^(]|\\g<1>)*)\\))", "(abc)(abc)", 6, 9, 2); // PR#43
+ x2("\\o{101}", "A", 0, 1);
+ x2("\\A(a|b\\g<1>c)\\k<1+3>\\z", "bbacca", 0, 6);
+ n("\\A(a|b\\g<1>c)\\k<1+3>\\z", "bbaccb");
+ x2("(?i)\\A(a|b\\g<1>c)\\k<1+2>\\z", "bBACcbac", 0, 8);
+ x2("(?i)(?<X>aa)|(?<X>bb)\\k<X>", "BBbb", 0, 4);
+ x2("(?:\\k'+1'B|(A)C)*", "ACAB", 4, 4); // relative backref by postitive number
+ x2("\\g<+2>(abc)(ABC){0}", "ABCabc", 0, 6); // relative call by positive number
+ x2("A\\g'0'|B()", "AAAAB", 4, 5);
+ x3("(A\\g'0')|B", "AAAAB", -1, -1, 1);
+ x2("(a*)(?(1))aa", "aaaaa", 3, 5);
+ x2("(a*)(?(-1))aa", "aaaaa", 3, 5);
+ x2("(?<name>aaa)(?('name'))aa", "aaaaa", 0, 5);
+ x2("(a)(?(1)aa|bb)a", "aaaaa", 1, 5);
+ x2("(?:aa|())(?(<1>)aa|bb)a", "aabba", 0, 5);
+ x2("(?:aa|())(?('1')aa|bb|cc)a", "aacca", 0, 5);
+ x3("(a*)(?(1)aa|a)b", "aaab", 1, 1, 1);
+ n("(a)(?(1)a|b)c", "abc");
+ x2("(a)(?(1)|)c", "ac", 0, 2);
+ n("(?()aaa|bbb)", "bbb");
+ x2("(a)(?(1+0)b|c)d", "abd", 0, 3);
+ x2("(?:(?'name'a)|(?'name'b))(?('name')c|d)e", "ace", 0, 3);
+ x2("(?:(?'name'a)|(?'name'b))(?('name')c|d)e", "bce", 0, 3);
+ x2("\\R", "\r\n", 1, 2);
+ x2("\\R", "\r", 0, 1);
+ x2("\\R", "\n", 0, 1);
+ x2("\\R", "\x0b", 0, 1);
+ n("\\R\\n", "\r\n");
+ x2("\\R", "\xc2\x85", 0, 2);
+ x2("\\N", "a", 0, 1);
+ n("\\N", "\n");
+ n("(?m:\\N)", "\n");
+ n("(?-m:\\N)", "\n");
+ x2("\\O", "a", 0, 1);
+ x2("\\O", "\n", 0, 1);
+ x2("(?m:\\O)", "\n", 0, 1);
+ x2("(?-m:\\O)", "\n", 0, 1);
+ x2("\\K", "a", 1, 1);
+ x2("a\\K", "a", 1, 1);
+ x2("a\\Kb", "ab", 1, 2);
+ x2("(a\\Kb|ac\\Kd)", "acd", 2, 3);
+ x2("(a\\Kb|\\Kac\\K)*", "acababacab", 10, 10);
+ x2("(?:()|())*\\1", "abc", 3, 3);
+ x2("(?:()|())*\\2", "abc", 3, 3);
+ x2("(?:()|()|())*\\3\\1", "abc", 3, 3);
+ x2("(|(?:a(?:\\g'1')*))b|", "abc", 3, 3);
+ x2("^(\"|)(.*)\\1$", "XX", 0, 2);
+ x2("(abc|def|ghi|jkl|mno|pqr|stu){0,10}?\\z", "admno", 5, 5);
+ x2("(abc|(def|ghi|jkl|mno|pqr){0,7}?){5}\\z", "adpqrpqrpqr", 11, 11); // cover OP_REPEAT_INC_NG_SG
+ x2("(?!abc).*\\z", "abcde", 5, 5); // cover OP_PREC_READ_NOT_END
+ x2("(.{2,})?", "abcde", 5, 5); // up coverage
+ x2("((a|b|c|d|e|f|g|h|i|j|k|l|m|n)+)?", "abcde", 5, 5); // up coverage
+ x2("((a|b|c|d|e|f|g|h|i|j|k|l|m|n){3,})?", "abcde", 5, 5); // up coverage
+ x2("((?:a(?:b|c|d|e|f|g|h|i|j|k|l|m|n))+)?", "abacadae", 8, 8); // up coverage
+ x2("((?:a(?:b|c|d|e|f|g|h|i|j|k|l|m|n))+?)?z", "abacadaez", 8, 9); // up coverage
+ x2("\\A((a|b)\?\?)?z", "bz", 0, 2); // up coverage
+ x2("((?<x>abc){0}a\\g<x>d)+", "aabcd", 0, 5); // up coverage
+ x2("((?(abc)true|false))+", "false", 0, 5); // up coverage
+ x2("((?i:abc)d)+", "abcdABCd", 4, 8); // up coverage
+ x2("((?<!abc)def)+", "bcdef", 2, 5); // up coverage
+ x2("(\\ba)+", "aaa", 0, 1); // up coverage
+ x2("()(?<x>ab)(?(<x>)a|b)", "aba", 0, 3); // up coverage
+ x2("(?<=a.b)c", "azbc", 3, 4); // up coverage
+ n("(?<=(?:abcde){30})z", "abc"); // up coverage
+ x2("(?<=(?(a)a|bb))z", "aaz", 2, 3); // up coverage
+ x2("[a]*\\W", "aa@", 2, 3); // up coverage
+ x2("[a]*[b]", "aab", 2, 3); // up coverage
+ n("a*\\W", "aaa"); // up coverage
+ n("(?W)a*\\W", "aaa"); // up coverage
+ x2("(?<=ab(?<=ab))", "ab", 2, 2); // up coverage
+ x2("(?<x>a)(?<x>b)(\\k<x>)+", "abbaab", 0, 6); // up coverage
+ x2("()(\\1)(\\2)", "abc", 3, 3); // up coverage
+ x2("((?(a)b|c))(\\1)", "abab", 0, 4); // up coverage
+ x2("(?<x>$|b\\g<x>)", "bbb", 3, 3); // up coverage
+ x2("(?<x>(?(a)a|b)|c\\g<x>)", "cccb", 3, 4); // up coverage
+ x2("(a)(?(1)a*|b*)+", "aaaa", 3, 4); // up coverage
+ x2("[[^abc]&&cde]*", "de", 2, 2); // up coverage
+ n("(a){10}{10}", "aa"); // up coverage
+ x2("(?:a?)+", "aa", 2, 2); // up coverage
+ x2("(?:a?)*?", "a", 1, 1); // up coverage
+ x2("(?:a*)*?", "a", 1, 1); // up coverage
+ x2("(?:a+?)*", "a", 1, 1); // up coverage
+ x2("\\h", "5", 0, 1); // up coverage
+ x2("\\H", "z", 0, 1); // up coverage
+ x2("[\\h]", "5", 0, 1); // up coverage
+ x2("[\\H]", "z", 0, 1); // up coverage
+ x2("[\\o{101}]", "A", 0, 1); // up coverage
+ x2("[\\u0041]", "A", 0, 1); // up coverage
+
+ x2("(?~)", "", 0, 0);
+ x2("(?~)", "A", 1, 1);
+ x2("aaaaa(?~)", "aaaaaaaaaa", 5, 10);
+ x2("(?~(?:|aaa))", "aaa", 3, 3);
+ x2("(?~aaa|)", "aaa", 3, 3);
+ x2("a(?~(?~)).", "abcdefghijklmnopqrstuvwxyz", 0, 26); // !!!
+ x2("/\\*(?~\\*/)\\*/", "/* */ */", 0, 5);
+ x2("(?~\\w+)zzzzz", "zzzzz", 0, 5);
+ x2("(?~\\w*)zzzzz", "zzzzz", 0, 5);
+ x2("(?~A.C|B)", "ABC", 3, 3);
+ x2("(?~XYZ|ABC)a", "ABCa", 3, 4);
+ x2("(?~XYZ|ABC)a", "aABCa", 4, 5);
+ x2("<[^>]*>(?~[<>])</[^>]*>", "<a>vvv</a> <b> </b>", 13, 22);
+ x2("(?~ab)", "ccc\ndab", 7, 7);
+ x2("(?m:(?~ab))", "ccc\ndab", 7, 7);
+ x2("(?-m:(?~ab))", "ccc\ndab", 7, 7);
+ x2("(?~abc)xyz", "xyz012345678901234567890123456789abc", 0, 3);
+
+ // absent with expr
+ x2("(?~|78|\\d*)", "123456789", 9, 9);
+ x2("(?~|def|(?:abc|de|f){0,100})", "abcdedeabcfdefabc", 17, 17);
+ x2("(?~|ab|.*)", "ccc\nddd", 7, 7);
+ x2("(?~|ab|\\O*)", "ccc\ndab", 7, 7);
+ x2("(?~|ab|\\O{2,10})", "ccc\ndab", 3, 5);
+ x2("(?~|ab|\\O{1,10})", "ab", 1, 2);
+ n("(?~|ab|\\O{2,10})", "ab");
+ x2("(?~|abc|\\O{1,10})", "abc", 2, 3);
+ x2("(?~|ab|\\O{5,10})|abc", "abc", 0, 3);
+ x2("(?~|ab|\\O{1,10})", "cccccccccccab", 12, 13);
+ x2("(?~|aaa|)", "aaa", 3, 3);
+ x2("(?~||a*)", "aaaaaa", 6, 6);
+ x2("(?~||a*?)", "aaaaaa", 6, 6);
+ x2("(a)(?~|b|\\1)", "aaaaaa", 4, 6);
+ x2("(a)(?~|bb|(?:a\\1)*)", "aaaaaa", 5, 6);
+ x2("(b|c)(?~|abac|(?:a\\1)*)", "abababacabab", 11, 12);
+ n("(?~|c|a*+)a", "aaaaa");
+ x2("(?~|aaaaa|a*+)", "aaaaa", 5, 5);
+ x2("(?~|aaaaaa|a*+)b", "aaaaaab", 6, 7);
+ x2("(?~|abcd|(?>))", "zzzabcd", 7, 7);
+ x2("(?~|abc|a*?)", "aaaabc", 6, 6);
+
+ // absent range cutter
+ x2("(?~|abc)a*", "aaaaaabc", 8, 8);
+ x2("(?~|abc)a*z|aaaaaabc", "aaaaaabc", 0, 8);
+ x2("(?~|aaaaaa)a*", "aaaaaa", 6, 6);
+ x2("(?~|abc)aaaa|aaaabc", "aaaabc", 0, 6);
+ x2("(?>(?~|abc))aaaa|aaaabc", "aaaabc", 0, 6);
+ x2("(?~|)a", "a", 0, 1);
+ n("(?~|a)a", "a");
+ x2("(?~|a)(?~|)a", "a", 0, 1);
+ x2("(?~|a).*(?~|)a", "bbbbbbbbbbbbbbbbbbbba", 20, 21);
+ x2("(?~|abc).*(xyz|pqr)(?~|)abc", "aaaaxyzaaapqrabc", 10, 16);
+ x2("(?~|abc).*(xyz|pqr)(?~|)abc", "aaaaxyzaaaabcpqrabc", 13, 19);
+ n("\\A(?~|abc).*(xyz|pqrabc)(?~|)abc", "aaaaxyzaaaabcpqrabcabc");
+
+ x2("", "あ", 3, 3);
+ x2("あ", "あ", 0, 3);
+ n("い", "あ");
+ x2("うう", "うう", 0, 6);
+ x2("あいう", "あいう", 0, 9);
+ x2("こここここここここここここここここここここここここここここここここここ", "こここここここここここここここここここここここここここここここここここ", 0, 105);
+ x2("あ", "いあ", 3, 6);
+ x2("いう", "あいう", 3, 9);
+ x2("\\xca\\xb8", "\xca\xb8", 0, 2);
+ x2(".", "あ", 0, 3);
+ x2("..", "かき", 0, 6);
+ x2("\\w", "お", 0, 3);
+ n("\\W", "あ");
+ x2("[\\W]", "う$", 3, 4);
+ x2("\\S", "そ", 0, 3);
+ x2("\\S", "漢", 0, 3);
+ x2("\\b", "気 ", 3, 3);
+ x2("\\b", " ほ", 4, 4);
+ x2("\\B", "せそ ", 7, 7);
+ x2("\\B", "う ", 4, 4);
+ x2("\\B", " い", 0, 0);
+ x2("[たち]", "ち", 0, 3);
+ n("[なに]", "ぬ");
+ x2("[う-お]", "え", 0, 3);
+ n("[^け]", "け");
+ x2("[\\w]", "ね", 0, 3);
+ n("[\\d]", "ふ");
+ x2("[\\D]", "は", 0, 3);
+ n("[\\s]", "く");
+ x2("[\\S]", "へ", 0, 3);
+ x2("[\\w\\d]", "よ", 0, 3);
+ x2("[\\w\\d]", " よ", 3, 6);
+ n("\\w鬼車", " 鬼車");
+ x2("鬼\\W車", "鬼 車", 0, 7);
+ x2("あ.い.う", "ああいいう", 0, 15);
+ x2(".\\wう\\W..ぞ", "えうう うぞぞ", 0, 19);
+ x2("\\s\\wこここ", " ここここ", 0, 13);
+ x2("ああ.け", "ああけけ", 0, 12);
+ n(".い", "いえ");
+ x2(".お", "おお", 0, 6);
+ x2("^あ", "あ", 0, 3);
+ x2("^む$", "む", 0, 3);
+ x2("^\\w$", "に", 0, 3);
+ x2("^\\wかきくけこ$", "zかきくけこ", 0, 16);
+ x2("^\\w...うえお$", "zあいううえお", 0, 19);
+ x2("\\w\\w\\s\\Wおおお\\d", "aお おおお4", 0, 16);
+ x2("\\Aたちつ", "たちつ", 0, 9);
+ x2("むめも\\Z", "むめも", 0, 9);
+ x2("かきく\\z", "かきく", 0, 9);
+ x2("かきく\\Z", "かきく\n", 0, 9);
+ n("\\Gぽぴ", "ぽぴ");
+ n("\\Gえ", "うえお");
+ x2("とて\\G", "とて", 0, 6);
+ n("まみ\\A", "まみ");
+ n("ま\\Aみ", "まみ");
+ x2("(?=せ)せ", "せ", 0, 3);
+ n("(?=う).", "い");
+ x2("(?!う)か", "か", 0, 3);
+ n("(?!と)あ", "と");
+ x2("(?i:あ)", "あ", 0, 3);
+ x2("(?i:ぶべ)", "ぶべ", 0, 6);
+ n("(?i:い)", "う");
+ x2("(?m:よ.)", "よ\n", 0, 4);
+ x2("(?m:.め)", "ま\nめ", 3, 7);
+ x2("あ?", "", 0, 0);
+ x2("変?", "化", 3, 3);
+ x2("変?", "変", 3, 3);
+ x2("量*", "", 0, 0);
+ x2("量*", "量", 3, 3);
+ x2("子*", "子子子", 9, 9);
+ x2("馬*", "鹿馬馬馬馬", 15, 15);
+ n("山+", "");
+ x2("河+", "河", 0, 3);
+ x2("時+", "時時時時", 9, 12);
+ x2("え+", "ええううう", 3, 6);
+ x2("う+", "おうううう", 12, 15);
+ x2(".?", "た", 3, 3);
+ x2(".*", "ぱぴぷぺ", 12, 12);
+ x2(".+", "ろ", 0, 3);
+ x2(".+", "いうえか\n", 9, 12);
+ x2("あ|い", "あ", 0, 3);
+ x2("あ|い", "い", 0, 3);
+ x2("あい|いう", "あい", 0, 6);
+ x2("あい|いう", "いう", 0, 6);
+ x2("を(?:かき|きく)", "をかき", 0, 9);
+ x2("を(?:かき|きく)け", "をきくけ", 0, 12);
+ x2("あい|(?:あう|あを)", "あを", 0, 6);
+ x2("あ|い|う", "えう", 3, 6);
+ x2("あ|い|うえ|おかき|く|けこさ|しすせ|そ|たち|つてとなに|ぬね", "しすせ", 0, 9);
+ n("あ|い|うえ|おかき|く|けこさ|しすせ|そ|たち|つてとなに|ぬね", "すせ");
+ x2("あ|^わ", "ぶあ", 3, 6);
+ x2("あ|^を", "をあ", 3, 6);
+ x2("鬼|\\G車", "け車鬼", 6, 9);
+ x2("鬼|\\G車", "車鬼", 3, 6);
+ x2("鬼|\\A車", "b車鬼", 4, 7);
+ x2("鬼|\\A車", "車", 0, 3);
+ x2("鬼|車\\Z", "車鬼", 3, 6);
+ x2("鬼|車\\Z", "車", 0, 3);
+ x2("鬼|車\\Z", "車\n", 0, 3);
+ x2("鬼|車\\z", "車鬼", 3, 6);
+ x2("鬼|車\\z", "車", 0, 3);
+ x2("\\w|\\s", "お", 0, 3);
+ x2("\\w|%", "%お", 1, 4);
+ x2("\\w|[&$]", "う&", 3, 4);
+ x2("[い-け]", "う", 0, 3);
+ x2("[い-け]|[^か-こ]", "あ", 0, 3);
+ x2("[い-け]|[^か-こ]", "か", 0, 3);
+ x2("[^あ]", "\n", 0, 1);
+ x2("(?:あ|[う-き])|いを", "うを", 0, 3);
+ x2("(?:あ|[う-き])|いを", "いを", 0, 6);
+ x2("あいう|(?=けけ)..ほ", "けけほ", 0, 9);
+ x2("あいう|(?!けけ)..ほ", "あいほ", 0, 9);
+ x2("(?=をあ)..あ|(?=をを)..あ", "ををあ", 0, 9);
+ x2("(?<=あ|いう)い", "いうい", 6, 9);
+ n("(?>あ|あいえ)う", "あいえう");
+ x2("(?>あいえ|あ)う", "あいえう", 0, 12);
+ x2("あ?|い", "あ", 3, 3);
+ x2("あ?|い", "い", 3, 3);
+ x2("あ?|い", "", 0, 0);
+ x2("あ*|い", "ああ", 6, 6);
+ x2("あ*|い*", "いあ", 6, 6);
+ x2("あ*|い*", "あい", 6, 6);
+ x2("[aあ]*|い*", "aあいいい", 13, 13);
+ x2("あ+|い*", "", 0, 0);
+ x2("あ+|い*", "いいい", 9, 9);
+ x2("あ+|い*", "あいいい", 12, 12);
+ x2("あ+|い*", "aあいいい", 13, 13);
+ n("あ+|い+", "");
+ x2("(あ|い)?", "い", 3, 3);
+ x2("(あ|い)*", "いあ", 6, 6);
+ x2("(あ|い)+", "いあい", 6, 9);
+ x2("(あい|うあ)+", "うああいうえ", 6, 12);
+ x2("(あい|うえ)+", "うああいうえ", 12, 18);
+ x2("(あい|うあ)+", "ああいうあ", 9, 15);
+ x2("(あい|うあ)+", "あいをうあ", 9, 15);
+ x2("(あい|うあ)+", "$$zzzzあいをうあ", 15, 21);
+ x2("(あ|いあい)+", "あいあいあ", 12, 15);
+ x2("(あ|いあい)+", "いあ", 3, 6);
+ x2("(あ|いあい)+", "いあああいあ", 15, 18);
+ x2("(?:あ|い)(?:あ|い)", "あい", 0, 6);
+ x2("(?:あ*|い*)(?:あ*|い*)", "あああいいい", 18, 18);
+ x2("(?:あ*|い*)(?:あ+|い+)", "あああいいい", 15, 18);
+ x2("(?:あ+|い+){2}", "あああいいい", 12, 18);
+ x2("(?:あ+|い+){1,2}", "あああいいい", 15, 18);
+ x2("(?:あ+|\\Aい*)うう", "うう", 0, 6);
+ n("(?:あ+|\\Aい*)うう", "あいうう");
+ x2("(?:^あ+|い+)*う", "ああいいいあいう", 21, 24);
+ x2("(?:^あ+|い+)*う", "ああいいいいう", 18, 21);
+ x2("う{0,}", "うううう", 12, 12);
+ x2("あ|(?i)c", "C", 0, 1);
+ x2("(?i)c|あ", "C", 0, 1);
+ x2("(?i:あ)|a", "a", 0, 1);
+ n("(?i:あ)|a", "A");
+ x2("[あいう]?", "あいう", 9, 9);
+ x2("[あいう]*", "あいう", 9, 9);
+ x2("[^あいう]*", "あいう", 9, 9);
+ n("[^あいう]+", "あいう");
+ x2("あ?\?", "あああ", 9, 9);
+ x2("いあ?\?い", "いあい", 0, 9);
+ x2("あ*?", "あああ", 9, 9);
+ x2("いあ*?", "いああ", 0, 3);
+ x2("いあ*?い", "いああい", 0, 12);
+ x2("あ+?", "あああ", 6, 9);
+ x2("いあ+?", "いああ", 0, 6);
+ x2("いあ+?い", "いああい", 0, 12);
+ x2("(?:天?)?\?", "天", 3, 3);
+ x2("(?:天?\?)?", "天", 3, 3);
+ x2("(?:夢?)+?", "夢夢夢", 9, 9);
+ x2("(?:風+)?\?", "風風風", 9, 9);
+ x2("(?:雪+)?\?霜", "雪雪雪霜", 9, 12);
+ x2("(?:あい)?{2}", "", 0, 0);
+ x2("(?:鬼車)?{2}", "鬼車鬼車鬼", 15, 15);
+ x2("(?:鬼車)*{0}", "鬼車鬼車鬼", 15, 15);
+ x2("(?:鬼車){3,}", "鬼車鬼車鬼車鬼車", 6, 24);
+ n("(?:鬼車){3,}", "鬼車鬼車");
+ x2("(?:鬼車){2,4}", "鬼車鬼車鬼車", 6, 18);
+ x2("(?:鬼車){2,4}", "鬼車鬼車鬼車鬼車鬼車", 18, 30);
+ x2("(?:鬼車){2,4}?", "鬼車鬼車鬼車鬼車鬼車", 18, 30);
+ x2("(?:鬼車){,}", "鬼車{,}", 0, 9);
+ x2("(?:かきく)+?{2}", "かきくかきくかきく", 9, 27);
+ x3("(火)", "火", 0, 3, 1);
+ x3("(火水)", "火水", 0, 6, 1);
+ x2("((時間))", "時間", 0, 6);
+ x3("((風水))", "風水", 0, 6, 1);
+ x3("((昨日))", "昨日", 0, 6, 2);
+ x3("((((((((((((((((((((量子))))))))))))))))))))", "量子", 0, 6, 20);
+ x3("(あい)(うえ)", "あいうえ", 0, 6, 1);
+ x3("(あい)(うえ)", "あいうえ", 6, 12, 2);
+ x3("()(あ)いう(えおか)きくけこ", "あいうえおかきくけこ", 9, 18, 3);
+ x3("(()(あ)いう(えおか)きくけこ)", "あいうえおかきくけこ", 9, 18, 4);
+ x3(".*(フォ)ン・マ(ン()シュタ)イン", "フォン・マンシュタイン", 15, 27, 2);
+ x2("(^あ)", "あ", 0, 3);
+ x3("(あ)|(あ)", "いあ", 3, 6, 1);
+ x3("(^あ)|(あ)", "いあ", 3, 6, 2);
+ x3("(あ?)", "あああ", 9, 9, 1);
+ x3("(ま*)", "ままま", 9, 9, 1);
+ x3("(と*)", "", 0, 0, 1);
+ x3("(る+)", "るるるるるるる", 18, 21, 1);
+ x3("(ふ+|へ*)", "ふふふへへ", 15, 15, 1);
+ x3("(あ+|い?)", "いいいああ", 15, 15, 1);
+ x3("(あいう)?", "あいう", -1, -1, 1);
+ x3("(あいう)*", "あいう", -1, -1, 1);
+ x3("(あいう)+", "あいう", 0, 9, 1);
+ x3("(さしす|あいう)+", "あいう", 0, 9, 1);
+ x3("([なにぬ][かきく]|かきく)+", "かきく", 0, 9, 1);
+ x3("((?i:あいう))", "あいう", 0, 9, 1);
+ x3("((?m:あ.う))", "あ\nう", 0, 7, 1);
+ x3("((?=あん)あ)", "あんい", 0, 3, 1);
+ x3("あいう|(.あいえ)", "んあいえ", 0, 12, 1);
+ x3("あ*(.)", "ああああん", 12, 15, 1);
+ x3("あ*?(.)", "ああああん", 12, 15, 1);
+ x3("あ*?(ん)", "ああああん", 12, 15, 1);
+ x3("[いうえ]あ*(.)", "えああああん", 15, 18, 1);
+ x3("(\\Aいい)うう", "いいうう", 0, 6, 1);
+ n("(\\Aいい)うう", "んいいうう");
+ x3("(^いい)うう", "いいうう", 0, 6, 1);
+ n("(^いい)うう", "んいいうう");
+ x3("ろろ(るる$)", "ろろるる", 6, 12, 1);
+ n("ろろ(るる$)", "ろろるるる");
+ x2("(無)\\1", "無無", 0, 6);
+ n("(無)\\1", "無武");
+ x2("(空?)\\1", "空空", 6, 6);
+ x2("(空?\?)\\1", "空空", 6, 6);
+ x2("(空*)\\1", "空空空空空", 15, 15);
+ x3("(空*)\\1", "空空空空空", 15, 15, 1);
+ x2("あ(い*)\\1", "あいいいい", 0, 15);
+ x2("あ(い*)\\1", "あい", 0, 3);
+ x2("(あ*)(い*)\\1\\2", "あああいいあああいい", 30, 30);
+ x2("(あ*)(い*)\\2", "あああいいいい", 21, 21);
+ x3("(あ*)(い*)\\2", "あああいいいい", 21, 21, 2);
+ x2("(((((((ぽ*)ぺ))))))ぴ\\7", "ぽぽぽぺぴぽぽぽ", 9, 15);
+ x3("(((((((ぽ*)ぺ))))))ぴ\\7", "ぽぽぽぺぴぽぽぽ", 9, 9, 7);
+ x2("(は)(ひ)(ふ)\\2\\1\\3", "はひふひはふ", 0, 18);
+ x2("([き-け])\\1", "くく", 0, 6);
+ x2("(\\w\\d\\s)\\1", "あ5 あ5 ", 0, 10);
+ n("(\\w\\d\\s)\\1", "あ5 あ5");
+ x2("(誰?|[あ-う]{3})\\1", "誰?誰?", 0, 12);
+ x2("...(誰?|[あ-う]{3})\\1", "あaあ誰?誰?", 0, 19);
+ x2("(誰?|[あ-う]{3})\\1", "ういうういう", 0, 18);
+ x2("(^こ)\\1", "ここ", 0, 6);
+ n("(^む)\\1", "めむむ");
+ n("(あ$)\\1", "ああ");
+ n("(あい\\Z)\\1", "あい");
+ x2("(あ*\\Z)\\1", "あ", 3, 3);
+ x2(".(あ*\\Z)\\1", "いあ", 3, 6);
+ x3("(.(やいゆ)\\2)", "zやいゆやいゆ", 0, 19, 1);
+ x3("(.(..\\d.)\\2)", "あ12341234", 0, 11, 1);
+ x2("((?i:あvず))\\1", "あvずあvず", 0, 14);
+ x2("(?<愚か>変|\\(\\g<愚か>\\))", "((((((変))))))", 6, 9);
+ x2("\\A(?:\\g<阿_1>|\\g<云_2>|\\z終了 (?<阿_1>観|自\\g<云_2>自)(?<云_2>在|菩薩\\g<阿_1>菩薩))$", "菩薩自菩薩自在自菩薩自菩薩", 0, 39);
+ x2("[[ひふ]]", "ふ", 0, 3);
+ x2("[[いおう]か]", "か", 0, 3);
+ n("[[^あ]]", "あ");
+ n("[^[あ]]", "あ");
+ x2("[^[^あ]]", "あ", 0, 3);
+ x2("[[かきく]&&きく]", "く", 0, 3);
+ n("[[かきく]&&きく]", "か");
+ n("[[かきく]&&きく]", "け");
+ x2("[あ-ん&&い-を&&う-ゑ]", "ゑ", 0, 3);
+ n("[^あ-ん&&い-を&&う-ゑ]", "ゑ");
+ x2("[[^あ&&あ]&&あ-ん]", "い", 0, 3);
+ n("[[^あ&&あ]&&あ-ん]", "あ");
+ x2("[[^あ-ん&&いうえお]&&[^う-か]]", "き", 0, 3);
+ n("[[^あ-ん&&いうえお]&&[^う-か]]", "い");
+ x2("[^[^あいう]&&[^うえお]]", "う", 0, 3);
+ x2("[^[^あいう]&&[^うえお]]", "え", 0, 3);
+ n("[^[^あいう]&&[^うえお]]", "か");
+ x2("[あ-&&-あ]", "-", 0, 1);
+ x2("[^[^a-zあいう]&&[^bcdefgうえお]q-w]", "え", 0, 3);
+ x2("[^[^a-zあいう]&&[^bcdefgうえお]g-w]", "f", 0, 1);
+ x2("[^[^a-zあいう]&&[^bcdefgうえお]g-w]", "g", 0, 1);
+ n("[^[^a-zあいう]&&[^bcdefgうえお]g-w]", "2");
+ x2("a<b>バージョンのダウンロード<\\/b>", "a<b>バージョンのダウンロード</b>", 0, 44);
+ x2(".<b>バージョンのダウンロード<\\/b>", "a<b>バージョンのダウンロード</b>", 0, 44);
+ x2("\\n?\\z", "こんにちは", 15, 15);
+ x2("(?m).*", "青赤黄", 9, 9);
+ x2("(?m).*a", "青赤黄a", 9, 10);
+
+ x2("\\p{Hiragana}", "ぴ", 0, 3);
+ n("\\P{Hiragana}", "ぴ");
+ x2("\\p{Emoji}", "\xE2\xAD\x90", 0, 3);
+ x2("\\p{^Emoji}", "\xEF\xBC\x93", 0, 3);
+ x2("\\p{Extended_Pictographic}", "\xE2\x9A\xA1", 0, 3);
+ n("\\p{Extended_Pictographic}", "\xE3\x81\x82");
+
+ x2("\\p{Word}", "こ", 0, 3);
+ n("\\p{^Word}", "こ");
+ x2("[\\p{Word}]", "こ", 0, 3);
+ n("[\\p{^Word}]", "こ");
+ n("[^\\p{Word}]", "こ");
+ x2("[^\\p{^Word}]", "こ", 0, 3);
+ x2("[^\\p{^Word}&&\\p{ASCII}]", "こ", 0, 3);
+ x2("[^\\p{^Word}&&\\p{ASCII}]", "a", 0, 1);
+ n("[^\\p{^Word}&&\\p{ASCII}]", "#");
+ x2("[^[\\p{^Word}]&&[\\p{ASCII}]]", "こ", 0, 3);
+ x2("[^[\\p{ASCII}]&&[^\\p{Word}]]", "こ", 0, 3);
+ n("[[\\p{ASCII}]&&[^\\p{Word}]]", "こ");
+ x2("[^[\\p{^Word}]&&[^\\p{ASCII}]]", "こ", 0, 3);
+ x2("[^\\x{104a}]", "こ", 0, 3);
+ x2("[^\\p{^Word}&&[^\\x{104a}]]", "こ", 0, 3);
+ x2("[^[\\p{^Word}]&&[^\\x{104a}]]", "こ", 0, 3);
+ n("[^\\p{Word}||[^\\x{104a}]]", "こ");
+
+ x2("\\p{^Cntrl}", "こ", 0, 3);
+ n("\\p{Cntrl}", "こ");
+ x2("[\\p{^Cntrl}]", "こ", 0, 3);
+ n("[\\p{Cntrl}]", "こ");
+ n("[^\\p{^Cntrl}]", "こ");
+ x2("[^\\p{Cntrl}]", "こ", 0, 3);
+ x2("[^\\p{Cntrl}&&\\p{ASCII}]", "こ", 0, 3);
+ x2("[^\\p{Cntrl}&&\\p{ASCII}]", "a", 0, 1);
+ n("[^\\p{^Cntrl}&&\\p{ASCII}]", "#");
+ x2("[^[\\p{^Cntrl}]&&[\\p{ASCII}]]", "こ", 0, 3);
+ x2("[^[\\p{ASCII}]&&[^\\p{Cntrl}]]", "こ", 0, 3);
+ n("[[\\p{ASCII}]&&[^\\p{Cntrl}]]", "こ");
+ n("[^[\\p{^Cntrl}]&&[^\\p{ASCII}]]", "こ");
+ n("[^\\p{^Cntrl}&&[^\\x{104a}]]", "こ");
+ n("[^[\\p{^Cntrl}]&&[^\\x{104a}]]", "こ");
+ n("[^\\p{Cntrl}||[^\\x{104a}]]", "こ");
+
+ x2("(?-W:\\p{Word})", "こ", 0, 3);
+ n("(?W:\\p{Word})", "こ");
+ x2("(?W:\\p{Word})", "k", 0, 1);
+ x2("(?-W:[[:word:]])", "こ", 0, 3);
+ n("(?W:[[:word:]])", "こ");
+ x2("(?-D:\\p{Digit})", "3", 0, 3);
+ n("(?D:\\p{Digit})", "3");
+ x2("(?-S:\\p{Space})", "\xc2\x85", 0, 2);
+ n("(?S:\\p{Space})", "\xc2\x85");
+ x2("(?-P:\\p{Word})", "こ", 0, 3);
+ n("(?P:\\p{Word})", "こ");
+ x2("(?-W:\\w)", "こ", 0, 3);
+ n("(?W:\\w)", "こ");
+ x2("(?-W:\\w)", "k", 0, 1);
+ x2("(?W:\\w)", "k", 0, 1);
+ n("(?-W:\\W)", "こ");
+ x2("(?W:\\W)", "こ", 0, 3);
+ n("(?-W:\\W)", "k");
+ n("(?W:\\W)", "k");
+
+ x2("(?-W:\\b)", "こ", 3, 3);
+ n("(?W:\\b)", "こ");
+ x2("(?-W:\\b)", "h", 1, 1);
+ x2("(?W:\\b)", "h", 1, 1);
+ n("(?-W:\\B)", "こ");
+ x2("(?W:\\B)", "こ", 3, 3);
+ n("(?-W:\\B)", "h");
+ n("(?W:\\B)", "h");
+ x2("(?-P:\\b)", "こ", 3, 3);
+ n("(?P:\\b)", "こ");
+ x2("(?-P:\\b)", "h", 1, 1);
+ x2("(?P:\\b)", "h", 1, 1);
+ n("(?-P:\\B)", "こ");
+ x2("(?P:\\B)", "こ", 3, 3);
+ n("(?-P:\\B)", "h");
+ n("(?P:\\B)", "h");
+
+ x2("\\p{InBasicLatin}", "\x41", 0, 1);
+ //x2("\\p{Grapheme_Cluster_Break_Regional_Indicator}", "\xF0\x9F\x87\xA9", 0, 4);
+ //n("\\p{Grapheme_Cluster_Break_Regional_Indicator}", "\xF0\x9F\x87\xA5");
+
+ // extended grapheme cluster
+
+ // CR + LF
+ n(".\\y\\O", "\x0d\x0a");
+ x2(".\\Y\\O", "\x0d\x0a", 0, 2);
+
+ // LATIN SMALL LETTER G, COMBINING DIAERESIS
+ n("^.\\y.$", "\x67\xCC\x88");
+ x2(".\\Y.", "\x67\xCC\x88", 0, 3);
+ x2("\\y.\\Y.\\y", "\x67\xCC\x88", 0, 3);
+ // HANGUL SYLLABLE GAG
+ x2("\\y.\\y", "\xEA\xB0\x81", 0, 3);
+ // HANGUL CHOSEONG KIYEOK, HANGUL JUNGSEONG A, HANGUL JONGSEONG KIYEOK
+ x2("^.\\Y.\\Y.$", "\xE1\x84\x80\xE1\x85\xA1\xE1\x86\xA8", 0, 9);
+ n("^.\\y.\\Y.$", "\xE1\x84\x80\xE1\x85\xA1\xE1\x86\xA8");
+ // TAMIL LETTER NA, TAMIL VOWEL SIGN I,
+ x2(".\\Y.", "\xE0\xAE\xA8\xE0\xAE\xBF", 0, 6);
+ n(".\\y.", "\xE0\xAE\xA8\xE0\xAE\xBF");
+ // THAI CHARACTER KO KAI, THAI CHARACTER SARA AM
+ x2(".\\Y.", "\xE0\xB8\x81\xE0\xB8\xB3", 0, 6);
+ n(".\\y.", "\xE0\xB8\x81\xE0\xB8\xB3");
+ // DEVANAGARI LETTER SSA, DEVANAGARI VOWEL SIGN I
+ x2(".\\Y.", "\xE0\xA4\xB7\xE0\xA4\xBF", 0, 6);
+ n(".\\y.", "\xE0\xA4\xB7\xE0\xA4\xBF");
+
+ // {Extended_Pictographic} Extend* ZWJ x {Extended_Pictographic}
+ x2("..\\Y.", "\xE3\x80\xB0\xE2\x80\x8D\xE2\xAD\x95", 0, 9);
+ x2("...\\Y.", "\xE3\x80\xB0\xCC\x82\xE2\x80\x8D\xE2\xAD\x95", 0, 11);
+ n("...\\Y.", "\xE3\x80\xB0\xCD\xB0\xE2\x80\x8D\xE2\xAD\x95");
+
+ // CR + LF
+ n("^\\X\\X$", "\x0d\x0a");
+ x2("^\\X$", "\x0d\x0a", 0, 2);
+ // LATIN SMALL LETTER G, COMBINING DIAERESIS
+ n("^\\X\\X.$", "\x67\xCC\x88");
+ x2("^\\X$", "\x67\xCC\x88", 0, 3);
+ // HANGUL CHOSEONG KIYEOK, HANGUL JUNGSEONG A, HANGUL JONGSEONG KIYEOK
+ x2("^\\X$", "\xE1\x84\x80\xE1\x85\xA1\xE1\x86\xA8", 0, 9);
+ n("^\\X\\X\\X$", "\xE1\x84\x80\xE1\x85\xA1\xE1\x86\xA8");
+ // TAMIL LETTER NA, TAMIL VOWEL SIGN I,
+ x2("^\\X$", "\xE0\xAE\xA8\xE0\xAE\xBF", 0, 6);
+ n("\\X\\X", "\xE0\xAE\xA8\xE0\xAE\xBF");
+ // THAI CHARACTER KO KAI, THAI CHARACTER SARA AM
+ x2("^\\X$", "\xE0\xB8\x81\xE0\xB8\xB3", 0, 6);
+ n("\\X\\X", "\xE0\xB8\x81\xE0\xB8\xB3");
+ // DEVANAGARI LETTER SSA, DEVANAGARI VOWEL SIGN I
+ x2("^\\X$", "\xE0\xA4\xB7\xE0\xA4\xBF", 0, 6);
+ n("\\X\\X", "\xE0\xA4\xB7\xE0\xA4\xBF");
+
+ n("^\\X.$", "\xE0\xAE\xA8\xE0\xAE\xBF");
+
+ // a + COMBINING GRAVE ACCENT (U+0300)
+ x2("h\\Xllo", "ha\xCC\x80llo", 0, 7);
+
+ // Text Segment: Extended Grapheme Cluster <-> Word Boundary
+ x2("(?y{g})\\yabc\\y", "abc", 0, 3);
+ x2("(?y{g})\\y\\X\\y", "abc", 2, 3);
+ x2("(?y{w})\\yabc\\y", "abc", 0, 3); // WB1, WB2
+ x2("(?y{w})\\y\\X", "\r\n", 0, 2); // WB3
+ x2("(?y{w})\\X", "\x0cz", 1, 2); // WB3a
+ x2("(?y{w})\\X", "q\x0c", 1, 2); // WB3b
+ x2("(?y{w})\\y\\X", "\xE2\x80\x8D\xE2\x9D\x87", 0, 6); // WB3c
+ x2("(?y{w})\\y\\X", "\x20\x20", 0, 2); // WB3d
+ x2("(?y{w})\\y\\X", "a\xE2\x80\x8D", 0, 4); // WB4
+ x2("(?y{w})\\y\\X\\y", "abc", 0, 3); // WB5
+ x2("(?y{w})\\y\\X\\y", "v\xCE\x87w", 0, 4); // WB6, WB7
+ x2("(?y{w})\\y\\X\\y", "\xD7\x93\x27", 0, 3); // WB7a
+ x2("(?y{w})\\y\\X\\y", "\xD7\x93\x22\xD7\x93", 0, 5); // WB7b, WB7c
+ x2("(?y{w})\\y\\X", "14 45", 3, 5); // WB8
+ x2("(?y{w})\\y\\X", "a14", 0, 3); // WB9
+ x2("(?y{w})\\y\\X", "832e", 0, 4); // WB10
+ x2("(?y{w})\\y\\X", "8\xEF\xBC\x8C\xDB\xB0", 0, 6); // WB11, WB12
+ x2("(?y{w})\\y\\X\\y", "ケン", 0, 6); // WB13
+ x2("(?y{w})\\y\\X\\y", "ケン\xE2\x80\xAFタ", 0, 12); // WB13a, WB13b
+ x2("(?y{w})\\y\\X\\y", "\x21\x23", 1, 2); // WB999
+ x2("(?y{w})\\y\\X\\y", "山ア", 3, 6);
+ x2("(?y{w})\\y\\X", "3.14", 0, 4);
+ x2("(?y{w})\\y\\X", "3 14", 2, 4);
+
+ x2("\\x40", "@", 0, 1);
+ x2("\\x1", "\x01", 0, 1);
+ x2("\\x{1}", "\x01", 0, 1);
+ x2("\\x{4E38}", "\xE4\xB8\xB8", 0, 3);
+ x2("\\u4E38", "\xE4\xB8\xB8", 0, 3);
+ x2("\\u0040", "@", 0, 1);
+
+ x2("c.*\\b", "abc", 2, 3);
+ x2("\\b.*abc.*\\b", "abc", 0, 3);
+ x2("((?()0+)+++(((0\\g<0>)0)|())++++((?(1)(0\\g<0>))++++++0*())++++((?(1)(0\\g<1>)+)++++++++++*())++++((?(1)((0)\\g<0>)+)++())+0++*+++(((0\\g<0>))*())++++((?(1)(0\\g<0>)+)++++++++++*|)++++*+++((?(1)((0)\\g<0>)+)+++++++++())++*|)++++((?()0))|", "abcde", 5, 5); // #139
+
+ n("(*FAIL)", "abcdefg");
+ n("abcd(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)(*FAIL)", "abcdefg");
+ x2("(?:[ab]|(*MAX{2}).)*", "abcbaaccaaa", 11, 11);
+ x2("(?:(*COUNT[AB]{X})[ab]|(*COUNT[CD]{X})[cd])*(*CMP{AB,<,CD})",
+ "abababcdab", 7, 8);
+ x2("(?(?{....})123|456)", "123", 0, 3);
+ x2("(?(*FAIL)123|456)", "456", 0, 3);
+
+ x2("\\g'0'++{,0}", "abcdefgh", 8, 8);
+ x2("\\g'0'++{,0}?", "abcdefgh", 8, 8);
+ x2("\\g'0'++{,0}b", "abcdefgh", 1, 2);
+ x2("\\g'0'++{,0}?def", "abcdefgh", 3, 6);
+ x2("a{1,3}?", "aaa", 2, 3);
+ x2("a{3}", "aaa", 0, 3);
+ x2("a{3}?", "aaa", 3, 3);
+ x2("a{3}?", "aa", 2, 2);
+ x2("a{3,3}?", "aaa", 0, 3);
+ n("a{3,3}?", "aa");
+ x2("a{1,3}+", "aaaaaa", 5, 6);
+ x2("a{3}+", "aaaaaa", 3, 6);
+ x2("a{3,3}+", "aaaaaa", 3, 6);
+ n("a{2,3}?", "a");
+ n("a{3,2}a", "aaa");
+ x2("a{3,2}b", "aaab", 1, 4);
+ x2("a{3,2}b", "aaaab", 2, 5);
+ x2("a{3,2}b", "aab", 0, 3);
+ x2("a{3,2}?", "", 0, 0); /* == (?:a{3,2})?*/
+ x2("a{2,3}+a", "aaa", 0, 3); /* == (?:a{2,3})+*/
+ x2("[\\x{0}-\\x{7fffffff}]", "a", 0, 1);
+ x2("[\\x{7f}-\\x{7fffffff}]", "\xe5\xae\xb6", 0, 3);
+ x2("[a[cdef]]", "a", 0, 1);
+ n("[a[xyz]-c]", "b");
+ x2("[a[xyz]-c]", "a", 0, 1);
+ x2("[a[xyz]-c]", "-", 0, 1);
+ x2("[a[xyz]-c]", "c", 0, 1);
+ x2("(a.c|def)(.{4})(?<=\\1)", "abcdabc", 0, 7);
+ x2("(a.c|de)(.{4})(?<=\\1)", "abcdabc", 0, 7);
+ x2("(a.c|def)(.{5})(?<=d\\1e)", "abcdabce", 0, 8);
+ x2("(a.c|.)d(?<=\\k<1>d)", "zzzzzabcdabc", 7, 9);
+ x2("(?<=az*)abc", "azzzzzzzzzzabcdabcabc", 11, 14);
+ x2("(?<=ab|abc|abcd)ef", "abcdef", 4, 6);
+ x2("(?<=ta+|tb+|tc+|td+)zz", "tcccccccccczz", 11, 13);
+ x2("(?<=t.{7}|t.{5}|t.{2}|t.)zz", "tczz", 2, 4);
+ x2("(?<=t.{7}|t.{5}|t.{2})zz", "tczzzz", 3, 5);
+ x2("(?<=t.{7}|t.{5}|t.{3})zz", "tczzazzbzz", 8, 10);
+ n("(?<=t.{7}|t.{5}|t.{3})zz", "tczzazzbczz");
+ x2("(?<=(ab|abc|abcd))ef", "abcdef", 4, 6);
+ x2("(?<=(ta+|tb+|tc+|td+))zz", "tcccccccccczz", 11, 13);
+ x2("(?<=(t.{7}|t.{5}|t.{2}|t.))zz", "tczz", 2, 4);
+ x2("(?<=(t.{7}|t.{5}|t.{2}))zz", "tczzzz", 3, 5);
+ x2("(?<=(t.{7}|t.{5}|t.{3}))zz", "tczzazzbzz", 8, 10);
+ n("(?<=(t.{7}|t.{5}|t.{3}))zz", "tczzazzbczz");
+ x2("(.{1,4})(.{1,4})(?<=\\2\\1)", "abaaba", 2, 4);
+ x2("(.{1,4})(.{1,4})(?<=\\2\\1)", "ababab", 2, 6);
+ n("(.{1,4})(.{1,4})(?<=\\2\\1)", "abcdabce");
+ x2("(.{1,4})(.{1,4})(?<=\\2\\1)", "abcdabceabce", 4, 12);
+ x2("(?<=a)", "a", 1, 1);
+ x2("(?<=a.*\\w)z", "abbbz", 4, 5);
+ n("(?<=a.*\\w)z", "abb z");
+ x2("(?<=a.*\\W)z", "abb z", 4, 5);
+ x2("(?<=a.*\\b)z", "abb z", 4, 5);
+ x2("(?<=(?>abc))", "abc", 3, 3);
+ x2("(?<=a\\Xz)", "abz", 3, 3);
+ n("(?<=^a*)bc", "zabc");
+ n("(?<=a*\\b)b", "abc");
+ x2("(?<=a+.*[efg])z", "abcdfz", 5, 6);
+ x2("(?<=a+.*[efg])z", "abcdfgz", 6, 7);
+ n("(?<=a+.*[efg])z", "bcdfz");
+ x2("(?<=a*.*[efg])z", "bcdfz", 4, 5);
+ n("(?<=a+.*[efg])z", "abcdz");
+ x2("(?<=v|t|a+.*[efg])z", "abcdfz", 5, 6);
+ x2("(?<=v|t|^a+.*[efg])z", "abcdfz", 5, 6);
+ x2("(?<=^(?:v|t|a+.*[efg]))z", "abcdfz", 5, 6);
+ x2("(?<=v|^t|a+.*[efg])z", "uabcdfz", 6, 7);
+ n("^..(?<=(a{,2}))\\1z", "aaaaz"); // !!! look-behind is shortest priority
+ x2("^..(?<=(a{,2}))\\1z", "aaz", 0, 3); // shortest priority
+ e("(?<=(?~|zoo)a.*z)", "abcdefz", ONIGERR_INVALID_LOOK_BEHIND_PATTERN);
+ e("(?<=(?~|)a.*z)", "abcdefz", ONIGERR_INVALID_LOOK_BEHIND_PATTERN);
+ e("(a(?~|boo)z){0}(?<=\\g<1>)", "abcdefz", ONIGERR_INVALID_LOOK_BEHIND_PATTERN);
+ x2("(?<=(?<= )| )", "abcde fg", 6, 6); // #173
+ x2("(?<=D|)(?<=@!nnnnnnnnnIIIIn;{1}D?()|<x@x*xxxD|)(?<=@xxx|xxxxx\\g<1>;{1}x)", "(?<=D|)(?<=@!nnnnnnnnnIIIIn;{1}D?()|<x@x*xxxD|)(?<=@xxx|xxxxx\\g<1>;{1}x)", 55, 55); // #173
+ x2("(?<=;()|)\\g<1>", "", 0, 0); // reduced #173
+ x2("(?<=;()|)\\k<1>", ";", 1, 1);
+ x2("(())\\g<3>{0}(?<=|())", "abc", 3, 3); // #175
+ x2("(?<=()|)\\1{0}", "abc", 3, 3);
+ e("(?<!xxxxxxxxxxxxxxxxxxxxxxx{32774}{65521}xxxxxxxx{65521}xxxxxxxxxxxxxx{32774}xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx)", "", ONIGERR_INVALID_LOOK_BEHIND_PATTERN); // #177
+ x2("(?<=(?<=abc))def", "abcdef", 3, 6);
+ x2("(?<=ab(?<=.+b)c)def", "abcdef", 3, 6);
+ n("(?<=ab(?<=a+)c)def", "abcdef");
+ n("(?<=abc)(?<!abc)def", "abcdef");
+ n("(?<!ab.)(?<=.bc)def", "abcdef");
+ x2("(?<!ab.)(?<=.bc)def", "abcdefcbcdef", 9, 12);
+ n("(?<!abc)def", "abcdef");
+ n("(?<!xxx|abc)def", "abcdef");
+ n("(?<!xxxxx|abc)def", "abcdef");
+ n("(?<!xxxxx|abc)def", "xxxxxxdef");
+ n("(?<!x+|abc)def", "abcdef");
+ n("(?<!x+|abc)def", "xxxxxxxxxdef");
+ x2("(?<!x+|abc)def", "xxxxxxxxzdef", 9, 12);
+ n("(?<!a.*z|a)def", "axxxxxxxzdef");
+ n("(?<!a.*z|a)def", "bxxxxxxxadef");
+ x2("(?<!a.*z|a)def", "axxxxxxxzdefxxdef", 14, 17);
+ x2("(?<!a.*z|a)def", "bxxxxxxxadefxxdef", 14, 17);
+ x2("(?<!a.*z|a)def", "bxxxxxxxzdef", 9, 12);
+ x2("(?<!x+|y+)\\d+", "xxx572", 5, 6);
+ x2("(?<!3+|4+)\\d+", "33334444", 0, 8);
+ n(".(?<!3+|4+)\\d+", "33334444");
+ n("(.{,3})..(?<!\\1)", "aaaaa");
+ x2("(.{,3})..(?<!\\1)", "abcde", 2, 5);
+ x2("(.{,3})...(?<!\\1)", "abcde", 1, 5);
+ x2("(a.c)(.{3,}?)(?<!\\1)", "abcabcd", 0, 7);
+ x2("(a*)(.{3,}?)(?<!\\1)", "abcabcd", 3, 7);
+ x2("(?:(a.*b)|c.*d)(?<!(?(1))azzzb)", "azzzzb", 0, 6);
+ n("(?:(a.*b)|c.*d)(?<!(?(1))azzzb)", "azzzb");
+ x2("<(?<!NT{+}abcd)", "<(?<!NT{+}abcd)", 3, 4);
+ x2("(?<!a.*c)def", "abbbbdef", 5, 8);
+ n("(?<!a.*c)def", "abbbcdef");
+ x2("(?<!a.*X\\b)def", "abbbbbXdef", 7, 10);
+ n("(?<!a.*X\\B)def", "abbbbbXdef");
+ x2("(?<!a.*[uvw])def", "abbbbbXdef", 7, 10);
+ n("(?<!a.*[uvw])def", "abbbbbwdef");
+ x2("(?<!ab*\\S+)def", "abbbbb def", 9, 12);
+ x2("(?<!a.*\\S)def", "abbbbb def", 7, 10);
+ n("(?<!ab*\\s+)def", "abbbbb def");
+ x2("(?<!ab*\\s+\\B)def", "abbbbb def", 9, 12);
+ n("(?<!v|t|a+.*[efg])z", "abcdfz");
+ x2("(?<!v|t|a+.*[efg])z", "abcdfzavzuz", 10, 11);
+ n("(?<!v|t|^a+.*[efg])z", "abcdfz");
+ n("(?<!^(?:v|t|a+.*[efg]))z", "abcdfz");
+ x2("(?<!v|^t|^a+.*[efg])z", "uabcdfz", 6, 7);
+
+ x2("((?(a)\\g<1>|b))", "aab", 2, 3);
+ x2("((?(a)\\g<1>))", "aab", 1, 2);
+ x2("(b(?(a)|\\g<1>))", "bba", 1, 3);
+ e("(()(?(2)\\g<1>))", "", ONIGERR_NEVER_ENDING_RECURSION);
+ x2("(?(a)(?:b|c))", "ac", 0, 2);
+ n("^(?(a)b|c)", "ac");
+ x2("(?i)a|b", "B", 0, 1);
+ n("((?i)a|b.)|c", "C");
+ n("c(?i)a.|b.", "Caz");
+ x2("c(?i)a|b", "cB", 0, 2); /* == c(?i:a|b) */
+ x2("c(?i)a.|b.", "cBb", 0, 3);
+
+ x2("(?i)st", "st", 0, 2);
+ x2("(?i)st", "St", 0, 2);
+ x2("(?i)st", "sT", 0, 2);
+ x2("(?i)st", "\xC5\xBFt", 0, 3); // U+017F
+ x2("(?i)st", "\xEF\xAC\x85", 0, 3); // U+FB05
+ x2("(?i)st", "\xEF\xAC\x86", 0, 3); // U+FB06
+ x2("(?i)ast", "Ast", 0, 3);
+ x2("(?i)ast", "ASt", 0, 3);
+ x2("(?i)ast", "AsT", 0, 3);
+ x2("(?i)ast", "A\xC5\xBFt", 0, 4); // U+017F
+ x2("(?i)ast", "A\xEF\xAC\x85", 0, 4); // U+FB05
+ x2("(?i)ast", "A\xEF\xAC\x86", 0, 4); // U+FB06
+ x2("(?i)stZ", "stz", 0, 3);
+ x2("(?i)stZ", "Stz", 0, 3);
+ x2("(?i)stZ", "sTz", 0, 3);
+ x2("(?i)stZ", "\xC5\xBFtz", 0, 4); // U+017F
+ x2("(?i)stZ", "\xEF\xAC\x85z", 0, 4); // U+FB05
+ x2("(?i)stZ", "\xEF\xAC\x86z", 0, 4); // U+FB06
+ x2("(?i)BstZ", "bstz", 0, 4);
+ x2("(?i)BstZ", "bStz", 0, 4);
+ x2("(?i)BstZ", "bsTz", 0, 4);
+ x2("(?i)BstZ", "b\xC5\xBFtz", 0, 5); // U+017F
+ x2("(?i)BstZ", "b\xEF\xAC\x85z", 0, 5); // U+FB05
+ x2("(?i)BstZ", "b\xEF\xAC\x86z", 0, 5); // U+FB06
+ x2("(?i).*st\\z", "tttssss\xC5\xBFt", 7, 10); // U+017F
+ x2("(?i).*st\\z", "tttssss\xEF\xAC\x85", 7, 10); // U+FB05
+ x2("(?i).*st\\z", "tttssss\xEF\xAC\x86", 7, 10); // U+FB06
+ x2("(?i).*あstい\\z", "tttssssあ\xC5\xBFtい", 7, 16); // U+017F
+ x2("(?i).*あstい\\z", "tttssssあ\xEF\xAC\x85い", 7, 16); // U+FB05
+ x2("(?i).*あstい\\z", "tttssssあ\xEF\xAC\x86い", 7, 16); // U+FB06
+ x2("(?i).*\xC5\xBFt\\z", "tttssssst", 7, 9); // U+017F
+ x2("(?i).*\xEF\xAC\x85\\z", "tttssssあst", 10, 12); // U+FB05
+ x2("(?i).*\xEF\xAC\x86い\\z", "tttssssstい", 7, 12); // U+FB06
+ x2("(?i).*\xEF\xAC\x85\\z", "tttssssあ\xEF\xAC\x85", 10, 13);
+
+ x2("(?i).*ss", "abcdefghijklmnopqrstuvwxyz\xc3\x9f", 26, 28); // U+00DF
+ x2("(?i).*ss.*", "abcdefghijklmnopqrstuvwxyz\xc3\x9fxyz", 26, 31); // U+00DF
+ x2("(?i).*\xc3\x9f", "abcdefghijklmnopqrstuvwxyzss", 26, 28); // U+00DF
+ x2("(?i).*ss.*", "abcdefghijklmnopqrstuvwxyzSSxyz", 26, 31);
+
+ x2("(?i)ssv", "\xc3\x9fv", 0, 3); // U+00DF
+ x2("(?i)(?<=ss)v", "SSv", 2, 3);
+ x2("(?i)(?<=\xc3\x9f)v", "\xc3\x9fv", 2, 3);
+ //x2("(?i)(?<=\xc3\x9f)v", "ssv", 2, 3);
+ //x2("(?i)(?<=ss)v", "\xc3\x9fv", 2, 3);
+
+ /* #156 U+01F0 (UTF-8: C7 B0) */
+ x2("(?i).+Isssǰ", ".+Isssǰ", 1, 8);
+ x2(".+Isssǰ", ".+Isssǰ", 1, 8);
+ x2("(?i)ǰ", "ǰ", 0, 2);
+ x2("(?i)ǰ", "j\xcc\x8c", 0, 3);
+ x2("(?i)j\xcc\x8c", "ǰ", 0, 2);
+ x2("(?i)5ǰ", "5ǰ", 0, 3);
+ x2("(?i)5ǰ", "5j\xcc\x8c", 0, 4);
+ x2("(?i)5j\xcc\x8c", "5ǰ", 0, 3);
+ x2("(?i)ǰv", "ǰV", 0, 3);
+ x2("(?i)ǰv", "j\xcc\x8cV", 0, 4);
+ x2("(?i)j\xcc\x8cv", "ǰV", 0, 3);
+ x2("(?i)[ǰ]", "ǰ", 0, 2);
+ x2("(?i)[ǰ]", "j\xcc\x8c", 0, 3);
+ //x2("(?i)[j]\xcc\x8c", "ǰ", 0, 2);
+ x2("(?i)\ufb00a", "ffa", 0, 3);
+ x2("(?i)ffz", "\xef\xac\x80z", 0, 4);
+ x2("(?i)\u2126", "\xcf\x89", 0, 2);
+ x2("a(?i)\u2126", "a\xcf\x89", 0, 3);
+ x2("(?i)A\u2126", "a\xcf\x89", 0, 3);
+ x2("(?i)A\u2126=", "a\xcf\x89=", 0, 4);
+ x2("(?i:ss)=1234567890", "\xc5\xbf\xc5\xbf=1234567890", 0, 15);
+
+ n("a(b|)+d", "abbbbbbbbbbbbbbbbbbbbbbbbbbbbbbcd"); /* https://www.haijin-boys.com/discussions/5079 */
+ n(" \xfd", ""); /* https://bugs.php.net/bug.php?id=77370 */
+ /* can't use \xfc00.. because compiler error: hex escape sequence out of range */
+ n("()0\\xfc00000\\xfc00000\\xfc00000\xfc", ""); /* https://bugs.php.net/bug.php?id=77371 */
+ x2("000||0\xfa", "0", 1, 1);
+ e("(?i)000000000000000000000\xf0", "", ONIGERR_INVALID_CODE_POINT_VALUE); /* https://bugs.php.net/bug.php?id=77382 */
+ n("0000\\\xf5", "0"); /* https://bugs.php.net/bug.php?id=77385 */
+ n("(?i)FFF00000000000000000\xfd", ""); /* https://bugs.php.net/bug.php?id=77394 */
+ e("x{55380}{77590}", "", ONIGERR_TOO_BIG_NUMBER_FOR_REPEAT_RANGE);
+ e("(xyz){40000}{99999}(?<name>vv)", "", ONIGERR_TOO_BIG_NUMBER_FOR_REPEAT_RANGE);
+ e("f{90000,90000}{80000,80000}", "", ONIGERR_TOO_BIG_NUMBER_FOR_REPEAT_RANGE);
+ n("f{90000,90000}{80000,80001}", "");
+
+ x2("\\p{Common}", "\xe3\x8b\xbf", 0, 3); /* U+32FF */
+ x2("\\p{In_Enclosed_CJK_Letters_and_Months}", "\xe3\x8b\xbf", 0, 3); /* U+32FF */
+
+ e("\\x{7fffffff}", "", ONIGERR_TOO_BIG_WIDE_CHAR_VALUE);
+ e("[\\x{7fffffff}]", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("\\u040", "@", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("(?<abc>\\g<abc>)", "zzzz", ONIGERR_NEVER_ENDING_RECURSION);
+ e("(*FOO)", "abcdefg", ONIGERR_UNDEFINED_CALLOUT_NAME);
+ e("*", "abc", ONIGERR_TARGET_OF_REPEAT_OPERATOR_NOT_SPECIFIED);
+ e("|*", "abc", ONIGERR_TARGET_OF_REPEAT_OPERATOR_NOT_SPECIFIED);
+ e("(?i)*", "abc", ONIGERR_TARGET_OF_REPEAT_OPERATOR_NOT_SPECIFIED);
+ e("(?:*)", "abc", ONIGERR_TARGET_OF_REPEAT_OPERATOR_NOT_SPECIFIED);
+ e("(?m:*)", "abc", ONIGERR_TARGET_OF_REPEAT_OPERATOR_NOT_SPECIFIED);
+ x2("(?:)*", "abc", 3, 3);
+ e("^*", "abc", ONIGERR_TARGET_OF_REPEAT_OPERATOR_INVALID);
+
+ fprintf(stdout,
+ "\nRESULT SUCC: %4d, FAIL: %d, ERROR: %d (by Oniguruma %s)\n",
+ nsucc, nfail, nerror, onig_version());
+
+ onig_region_free(region, 1);
+ onig_end();
+
+ return ((nfail == 0 && nerror == 0) ? 0 : -1);
+}
diff --git a/test/test_regset.c b/test/test_regset.c
index 497fbd6..c8442a1 100644
--- a/test/test_regset.c
+++ b/test/test_regset.c
@@ -66,19 +66,16 @@ make_regset(int line_no, int n, char* pat[], OnigRegSet** rset, int error_no)
return 0;
}
-#ifndef _WIN32
-
static double
-get_sec(struct timespec* ts, struct timespec* te)
+get_sec(clock_t start, clock_t end)
{
double t;
- t = (te->tv_sec - ts->tv_sec) +
- (double )(te->tv_nsec - ts->tv_nsec) / 1000000000.0;
+ t = (double )(end - start) / CLOCKS_PER_SEC;
return t;
}
-/* clock_gettime() doesn't exist in Windows */
+/* use clock(), because clock_gettime() doesn't exist in Windows and old Unix. */
static int
time_test(int repeat, int n, char* ps[], char* s, char* end, double* rt_set, double* rt_reg)
@@ -87,14 +84,13 @@ time_test(int repeat, int n, char* ps[], char* s, char* end, double* rt_set, dou
int i;
int match_pos;
OnigRegSet* set;
- struct timespec ts1, ts2;
+ clock_t ts1, ts2;
double t_set, t_reg;
r = make_regset(0, n, ps, &set, 0);
if (r != 0) return r;
- clock_gettime(CLOCK_PROCESS_CPUTIME_ID, &ts1);
-
+ ts1 = clock();
for (i = 0; i < repeat; i++) {
r = onig_regset_search(set, (UChar* )s, (UChar* )end, (UChar* )s, (UChar* )end,
ONIG_REGSET_POSITION_LEAD, ONIG_OPTION_NONE, &match_pos);
@@ -104,12 +100,10 @@ time_test(int repeat, int n, char* ps[], char* s, char* end, double* rt_set, dou
}
}
- clock_gettime(CLOCK_PROCESS_CPUTIME_ID, &ts2);
- t_set = get_sec(&ts1, &ts2);
-
-
- clock_gettime(CLOCK_PROCESS_CPUTIME_ID, &ts1);
+ ts2 = clock();
+ t_set = get_sec(ts1, ts2);
+ ts1 = clock();
for (i = 0; i < repeat; i++) {
r = onig_regset_search(set, (UChar* )s, (UChar* )end, (UChar* )s, (UChar* )end,
ONIG_REGSET_REGEX_LEAD, ONIG_OPTION_NONE, &match_pos);
@@ -119,16 +113,15 @@ time_test(int repeat, int n, char* ps[], char* s, char* end, double* rt_set, dou
}
}
- clock_gettime(CLOCK_PROCESS_CPUTIME_ID, &ts2);
- onig_regset_free(set);
+ ts2 = clock();
+ t_reg = get_sec(ts1, ts2);
- t_reg = get_sec(&ts1, &ts2);
+ onig_regset_free(set);
*rt_set = t_set;
*rt_reg = t_reg;
return 0;
}
-#endif
static void
fisher_yates_shuffle(int n, char* ps[], char* cps[])
@@ -147,7 +140,6 @@ fisher_yates_shuffle(int n, char* ps[], char* cps[])
}
}
-#ifndef _WIN32
static void
time_compare(int n, char* ps[], char* s, char* end)
{
@@ -176,7 +168,6 @@ time_compare(int n, char* ps[], char* s, char* end)
fprintf(stdout, "POS lead: %6.2lfmsec. REG lead: %6.2lfmsec.\n",
total_set * 1000.0, total_reg * 1000.0);
}
-#endif
static OnigRegSetLead XX_LEAD = ONIG_REGSET_POSITION_LEAD;
@@ -391,11 +382,15 @@ static char* p7[] = {
"0+", "1+", "2+", "3+", "4+", "5+", "6+", "7+", "8+", "9+",
};
+static char* p8[] = {"a", ".*"};
+
extern int
main(int argc, char* argv[])
{
- int r;
+#ifndef _WIN32
int file_exist;
+#endif
+ int r;
char *s, *end;
OnigEncoding use_encs[1];
@@ -412,6 +407,7 @@ main(int argc, char* argv[])
N(p2, " XXXX AAA 1223 012345678bbb");
X2(p2, "0123456789", 9, 10);
X2(p7, "abcde 555 qwert", 6, 9);
+ X2(p8, "", 0, 0);
XX_LEAD = ONIG_REGSET_REGEX_LEAD;
@@ -432,22 +428,20 @@ main(int argc, char* argv[])
fprintf(stdout, "Ignore %s\n", TEXT_PATH);
file_exist = 0;
}
-#else
- file_exist = 0;
-#endif
if (file_exist != 0) {
X2(p2, s, 10, 22);
X2(p3, s, 496079, 496088);
X2(p4, s, 1294, 1315);
}
+#endif
fprintf(stdout,
"\nRESULT SUCC: %4d, FAIL: %d, ERROR: %d (by Oniguruma %s)\n",
nsucc, nfail, nerror, onig_version());
- if (file_exist != 0) {
#ifndef _WIN32
+ if (file_exist != 0) {
fprintf(stdout, "\n");
time_compare(ASIZE(p2), p2, s, end);
time_compare(ASIZE(p3), p3, s, end);
@@ -455,9 +449,9 @@ main(int argc, char* argv[])
time_compare(ASIZE(p5), p5, s, end);
time_compare(ASIZE(p6), p6, s, end);
fprintf(stdout, "\n");
-#endif
free(s);
}
+#endif
onig_end();
diff --git a/test/test_syntax.c b/test/test_syntax.c
new file mode 100644
index 0000000..df80e59
--- /dev/null
+++ b/test/test_syntax.c
@@ -0,0 +1,246 @@
+/*
+ * test_syntax.c
+ * Copyright (c) 2019-2020 K.Kosako
+ */
+#include "config.h"
+#ifdef ONIG_ESCAPE_UCHAR_COLLISION
+#undef ONIG_ESCAPE_UCHAR_COLLISION
+#endif
+
+#include <stdio.h>
+#include <string.h>
+#include "oniguruma.h"
+
+#define SLEN(s) strlen(s)
+
+static int nsucc = 0;
+static int nfail = 0;
+static int nerror = 0;
+
+static FILE* err_file;
+
+static OnigRegion* region;
+
+static OnigSyntaxType* Syntax;
+
+static void xx(char* pattern, char* str, int from, int to, int mem, int not,
+ int error_no)
+{
+ int r;
+ regex_t* reg;
+ OnigErrorInfo einfo;
+
+ r = onig_new(&reg, (UChar* )pattern, (UChar* )(pattern + SLEN(pattern)),
+ ONIG_OPTION_DEFAULT, ONIG_ENCODING_UTF8, Syntax, &einfo);
+ if (r) {
+ char s[ONIG_MAX_ERROR_MESSAGE_LEN];
+
+ if (error_no == 0) {
+ onig_error_code_to_str((UChar* )s, r, &einfo);
+ fprintf(err_file, "ERROR: %s /%s/\n", s, pattern);
+ nerror++;
+ }
+ else {
+ if (r == error_no) {
+ fprintf(stdout, "OK(ERROR): /%s/ %d\n", pattern, r);
+ nsucc++;
+ }
+ else {
+ fprintf(stdout, "FAIL(ERROR): /%s/ '%s', %d, %d\n", pattern, str,
+ error_no, r);
+ nfail++;
+ }
+ }
+
+ return ;
+ }
+
+ r = onig_search(reg, (UChar* )str, (UChar* )(str + SLEN(str)),
+ (UChar* )str, (UChar* )(str + SLEN(str)),
+ region, ONIG_OPTION_NONE);
+ if (r < ONIG_MISMATCH) {
+ char s[ONIG_MAX_ERROR_MESSAGE_LEN];
+
+ if (error_no == 0) {
+ onig_error_code_to_str((UChar* )s, r);
+ fprintf(err_file, "ERROR: %s /%s/\n", s, pattern);
+ nerror++;
+ }
+ else {
+ if (r == error_no) {
+ fprintf(stdout, "OK(ERROR): /%s/ '%s', %d\n", pattern, str, r);
+ nsucc++;
+ }
+ else {
+ fprintf(stdout, "FAIL ERROR NO: /%s/ '%s', %d, %d\n", pattern, str,
+ error_no, r);
+ nfail++;
+ }
+ }
+
+ return ;
+ }
+
+ if (r == ONIG_MISMATCH) {
+ if (not) {
+ fprintf(stdout, "OK(N): /%s/ '%s'\n", pattern, str);
+ nsucc++;
+ }
+ else {
+ fprintf(stdout, "FAIL: /%s/ '%s'\n", pattern, str);
+ nfail++;
+ }
+ }
+ else {
+ if (not) {
+ fprintf(stdout, "FAIL(N): /%s/ '%s'\n", pattern, str);
+ nfail++;
+ }
+ else {
+ if (region->beg[mem] == from && region->end[mem] == to) {
+ fprintf(stdout, "OK: /%s/ '%s'\n", pattern, str);
+ nsucc++;
+ }
+ else {
+ fprintf(stdout, "FAIL: /%s/ '%s' %d-%d : %d-%d\n", pattern, str,
+ from, to, region->beg[mem], region->end[mem]);
+ nfail++;
+ }
+ }
+ }
+ onig_free(reg);
+}
+
+static void x2(char* pattern, char* str, int from, int to)
+{
+ xx(pattern, str, from, to, 0, 0, 0);
+}
+
+static void x3(char* pattern, char* str, int from, int to, int mem)
+{
+ xx(pattern, str, from, to, mem, 0, 0);
+}
+
+static void n(char* pattern, char* str)
+{
+ xx(pattern, str, 0, 0, 0, 1, 0);
+}
+
+static void e(char* pattern, char* str, int error_no)
+{
+ xx(pattern, str, 0, 0, 0, 0, error_no);
+}
+
+static int test_fixed_interval()
+{
+ x2("a{1,3}?", "aaa", 0, 1);
+ x2("a{3}", "aaa", 0, 3);
+ x2("a{3}?", "aaa", 0, 3);
+ n("a{3}?", "aa");
+ x2("a{3,3}?", "aaa", 0, 3);
+ n("a{3,3}?", "aa");
+
+ x2("a{1,3}+", "aaaaaa", 0, 3);
+ x2("a{3}+", "aaaaaa", 0, 3);
+ x2("a{3,3}+", "aaaaaa", 0, 3);
+
+ return 0;
+}
+
+static int test_isolated_option()
+{
+ x2("", "", 0, 0);
+ x2("^", "", 0, 0);
+ n("^a", "\na");
+ n(".", "\n");
+ x2("(?s:.)", "\n", 0, 1);
+ x2("(?s).", "\n", 0, 1);
+ x2("(?s)a|.", "\n", 0, 1);
+ n("(?s:a)|.", "\n");
+ x2("b(?s)a|.", "\n", 0, 1);
+ n("((?s)a)|.", "\n");
+ n("b(?:(?s)a)|z|.", "\n");
+ n(".|b(?s)a", "\n");
+ n(".(?s)", "\n");
+ n("(?s)(?-s)a|.", "\n");
+ x2("(?s)a|.(?-s)", "\n", 0, 1);
+ x2("(?s)a|((?-s)).", "\n", 0, 1);
+ x2("(?s)a|(?:(?-s)).", "\n", 0, 1); // !!! Perl 5.26.1 returns empty match
+ x2("(?s)a|(?:).", "\n", 0, 1); // !!! Perl 5.26.1 returns empty match
+ x2("(?s)a|(?:.)", "\n", 0, 1);
+ x2("(?s)a|(?:a*).", "\n", 0, 1);
+ n("a|(?:).", "\n"); // !!! Perl 5.26.1 returns empty match
+ n("a|(?:)(.)", "\n");
+ x2("(?s)a|(?:)(.)", "\n", 0, 1);
+ x2("b(?s)a|(?:)(.)", "\n", 0, 1);
+ n("b((?s)a)|(?:)(.)", "\n");
+
+ return 0;
+}
+
+static int test_prec_read()
+{
+ x2("(?=a).b", "ab", 0, 2);
+ x2("(?=ab|(.))\\1", "ab", 1, 2); // doesn't backtrack if success once in prec-read
+ n("(?!(.)z)a\\1", "aa"); // ! Perl 5.26.1 match with "aa"
+
+ return 0;
+}
+
+static int test_look_behind()
+{
+ x2("(?<=a)b", "ab", 1, 2);
+ x2("(?<=a|b)c", "abc", 2, 3);
+ x2("(?<=a|(.))\\1", "abcc", 3, 4);
+
+ // following is not match in Perl and Java
+ //x2("(?<=a|(.))\\1", "aa", 1, 2);
+
+ n("(?<!c|c)a", "ca");
+
+ return 0;
+}
+
+extern int main(int argc, char* argv[])
+{
+ OnigEncoding use_encs[1];
+
+ use_encs[0] = ONIG_ENCODING_UTF8;
+ onig_initialize(use_encs, sizeof(use_encs)/sizeof(use_encs[0]));
+
+ err_file = stdout;
+
+ region = onig_region_new();
+
+ Syntax = ONIG_SYNTAX_PERL;
+
+ test_fixed_interval();
+ test_isolated_option();
+ test_prec_read();
+ test_look_behind();
+ e("(?<=ab|(.))\\1", "abb", ONIGERR_INVALID_LOOK_BEHIND_PATTERN); // Variable length lookbehind not implemented in Perl 5.26.1
+
+ x3("()", "abc", 0, 0, 1);
+ e("(", "", ONIGERR_END_PATTERN_WITH_UNMATCHED_PARENTHESIS);
+ // different spec.
+ // e("\\x{7fffffff}", "", ONIGERR_TOO_BIG_WIDE_CHAR_VALUE);
+
+ Syntax = ONIG_SYNTAX_JAVA;
+
+ test_fixed_interval();
+ test_isolated_option();
+ test_prec_read();
+ test_look_behind();
+ x2("(?<=ab|(.))\\1", "abb", 2, 3);
+ n("(?<!ab|b)c", "bbc");
+ n("(?<!b|ab)c", "bbc");
+
+ fprintf(stdout,
+ "\nRESULT SUCC: %4d, FAIL: %d, ERROR: %d (by Oniguruma %s)\n",
+ nsucc, nfail, nerror, onig_version());
+
+ onig_region_free(region, 1);
+ onig_end();
+
+ return ((nfail == 0 && nerror == 0) ? 0 : -1);
+}
diff --git a/test/test_utf8.c b/test/test_utf8.c
index d6fc761..1bbc071 100644
--- a/test/test_utf8.c
+++ b/test/test_utf8.c
@@ -1,6 +1,6 @@
/*
* test_utf8.c
- * Copyright (c) 2019 K.Kosako
+ * Copyright (c) 2019-2020 K.Kosako
*/
#include "config.h"
#ifdef ONIG_ESCAPE_UCHAR_COLLISION
@@ -685,7 +685,7 @@ extern int main(int argc, char* argv[])
x2("aaaaa(?~)", "aaaaaaaaaa", 0, 5);
x2("(?~(?:|aaa))", "aaa", 0, 0);
x2("(?~aaa|)", "aaa", 0, 0);
- x2("a(?~(?~)).", "abcdefghijklmnopqrstuvwxyz", 0, 26); // !!!
+ x2("a(?~(?~)).", "abcdefghijklmnopqrstuvwxyz", 0, 26); // nested absent functions cause strange result
x2("/\\*(?~\\*/)\\*/", "/* */ */", 0, 5);
x2("(?~\\w+)zzzzz", "zzzzz", 0, 5);
x2("(?~\\w*)zzzzz", "zzzzz", 0, 5);
@@ -1198,6 +1198,15 @@ extern int main(int argc, char* argv[])
x2("\\g'0'++{,0}?", "abcdefgh", 0, 0);
x2("\\g'0'++{,0}b", "abcdefgh", 1, 2);
x2("\\g'0'++{,0}?def", "abcdefgh", 3, 6);
+ x2("a{1,3}?", "aaa", 0, 1);
+ x2("a{3}", "aaa", 0, 3);
+ x2("a{3}?", "aaa", 0, 3);
+ x2("a{3}?", "aa", 0, 0);
+ x2("a{3,3}?", "aaa", 0, 3);
+ n("a{3,3}?", "aa");
+ x2("a{1,3}+", "aaaaaa", 0, 6);
+ x2("a{3}+", "aaaaaa", 0, 6);
+ x2("a{3,3}+", "aaaaaa", 0, 6);
n("a{2,3}?", "a");
n("a{3,2}a", "aaa");
x2("a{3,2}b", "aaab", 0, 4);
@@ -1212,11 +1221,113 @@ extern int main(int argc, char* argv[])
x2("[a[xyz]-c]", "a", 0, 1);
x2("[a[xyz]-c]", "-", 0, 1);
x2("[a[xyz]-c]", "c", 0, 1);
+ x2("(a.c|def)(.{4})(?<=\\1)", "abcdabc", 0, 7);
+ x2("(a.c|de)(.{4})(?<=\\1)", "abcdabc", 0, 7);
+ x2("(a.c|def)(.{5})(?<=d\\1e)", "abcdabce", 0, 8);
+ x2("(a.c|.)d(?<=\\k<1>d)", "zzzzzabcdabc", 5, 9);
+ x2("(?<=az*)abc", "azzzzzzzzzzabcdabcabc", 11, 14);
+ x2("(?<=ab|abc|abcd)ef", "abcdef", 4, 6);
+ x2("(?<=ta+|tb+|tc+|td+)zz", "tcccccccccczz", 11, 13);
+ x2("(?<=t.{7}|t.{5}|t.{2}|t.)zz", "tczz", 2, 4);
+ x2("(?<=t.{7}|t.{5}|t.{2})zz", "tczzzz", 3, 5);
+ x2("(?<=t.{7}|t.{5}|t.{3})zz", "tczzazzbzz", 8, 10);
+ n("(?<=t.{7}|t.{5}|t.{3})zz", "tczzazzbczz");
+ x2("(?<=(ab|abc|abcd))ef", "abcdef", 4, 6);
+ x2("(?<=(ta+|tb+|tc+|td+))zz", "tcccccccccczz", 11, 13);
+ x2("(?<=(t.{7}|t.{5}|t.{2}|t.))zz", "tczz", 2, 4);
+ x2("(?<=(t.{7}|t.{5}|t.{2}))zz", "tczzzz", 3, 5);
+ x2("(?<=(t.{7}|t.{5}|t.{3}))zz", "tczzazzbzz", 8, 10);
+ n("(?<=(t.{7}|t.{5}|t.{3}))zz", "tczzazzbczz");
+ x2("(.{1,4})(.{1,4})(?<=\\2\\1)", "abaaba", 0, 6);
+ x2("(.{1,4})(.{1,4})(?<=\\2\\1)", "ababab", 0, 6);
+ n("(.{1,4})(.{1,4})(?<=\\2\\1)", "abcdabce");
+ x2("(.{1,4})(.{1,4})(?<=\\2\\1)", "abcdabceabce", 4, 12);
+ x2("(?<=a)", "a", 1, 1);
+ x2("(?<=a.*\\w)z", "abbbz", 4, 5);
+ n("(?<=a.*\\w)z", "abb z");
+ x2("(?<=a.*\\W)z", "abb z", 4, 5);
+ x2("(?<=a.*\\b)z", "abb z", 4, 5);
+ x2("(?<=(?>abc))", "abc", 3, 3);
+ x2("(?<=a\\Xz)", "abz", 3, 3);
+ n("(?<=^a*)bc", "zabc");
+ n("(?<=a*\\b)b", "abc");
+ x2("(?<=a+.*[efg])z", "abcdfz", 5, 6);
+ x2("(?<=a+.*[efg])z", "abcdfgz", 6, 7);
+ n("(?<=a+.*[efg])z", "bcdfz");
+ x2("(?<=a*.*[efg])z", "bcdfz", 4, 5);
+ n("(?<=a+.*[efg])z", "abcdz");
+ x2("(?<=v|t|a+.*[efg])z", "abcdfz", 5, 6);
+ x2("(?<=v|t|^a+.*[efg])z", "abcdfz", 5, 6);
+ x2("(?<=^(?:v|t|a+.*[efg]))z", "abcdfz", 5, 6);
+ x2("(?<=v|^t|a+.*[efg])z", "uabcdfz", 6, 7);
+ n("^..(?<=(a{,2}))\\1z", "aaaaz"); // !!! look-behind is shortest priority
+ x2("^..(?<=(a{,2}))\\1z", "aaz", 0, 3); // shortest priority
+ e("(?<=(?~|zoo)a.*z)", "abcdefz", ONIGERR_INVALID_LOOK_BEHIND_PATTERN);
+ e("(?<=(?~|)a.*z)", "abcdefz", ONIGERR_INVALID_LOOK_BEHIND_PATTERN);
+ e("(a(?~|boo)z){0}(?<=\\g<1>)", "abcdefz", ONIGERR_INVALID_LOOK_BEHIND_PATTERN);
+ x2("(?<=(?<= )| )", "abcde fg", 6, 6); // #173
+ x2("(?<=D|)(?<=@!nnnnnnnnnIIIIn;{1}D?()|<x@x*xxxD|)(?<=@xxx|xxxxx\\g<1>;{1}x)", "(?<=D|)(?<=@!nnnnnnnnnIIIIn;{1}D?()|<x@x*xxxD|)(?<=@xxx|xxxxx\\g<1>;{1}x)", 55, 55); // #173
+ x2("(?<=;()|)\\g<1>", "", 0, 0); // reduced #173
+ x2("(?<=;()|)\\k<1>", ";", 1, 1);
+ x2("(())\\g<3>{0}(?<=|())", "abc", 0, 0); // #175
+ x2("(?<=()|)\\1{0}", "abc", 0, 0);
+ e("(?<!xxxxxxxxxxxxxxxxxxxxxxx{32774}{65521}xxxxxxxx{65521}xxxxxxxxxxxxxx{32774}xxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxxx)", "", ONIGERR_INVALID_LOOK_BEHIND_PATTERN); // #177
+ x2("(?<=(?<=abc))def", "abcdef", 3, 6);
+ x2("(?<=ab(?<=.+b)c)def", "abcdef", 3, 6);
+ n("(?<=ab(?<=a+)c)def", "abcdef");
+ n("(?<=abc)(?<!abc)def", "abcdef");
+ n("(?<!ab.)(?<=.bc)def", "abcdef");
+ x2("(?<!ab.)(?<=.bc)def", "abcdefcbcdef", 9, 12);
+ n("(?<!abc)def", "abcdef");
+ n("(?<!xxx|abc)def", "abcdef");
+ n("(?<!xxxxx|abc)def", "abcdef");
+ n("(?<!xxxxx|abc)def", "xxxxxxdef");
+ n("(?<!x+|abc)def", "abcdef");
+ n("(?<!x+|abc)def", "xxxxxxxxxdef");
+ x2("(?<!x+|abc)def", "xxxxxxxxzdef", 9, 12);
+ n("(?<!a.*z|a)def", "axxxxxxxzdef");
+ n("(?<!a.*z|a)def", "bxxxxxxxadef");
+ x2("(?<!a.*z|a)def", "axxxxxxxzdefxxdef", 14, 17);
+ x2("(?<!a.*z|a)def", "bxxxxxxxadefxxdef", 14, 17);
+ x2("(?<!a.*z|a)def", "bxxxxxxxzdef", 9, 12);
+ x2("(?<!x+|y+)\\d+", "xxx572", 4, 6);
+ x2("(?<!3+|4+)\\d+", "33334444", 0, 8);
+ n(".(?<!3+|4+)\\d+", "33334444");
+ n("(.{,3})..(?<!\\1)", "aaaaa");
+ x2("(.{,3})..(?<!\\1)", "abcde", 0, 5);
+ x2("(.{,3})...(?<!\\1)", "abcde", 0, 5);
+ x2("(a.c)(.{3,}?)(?<!\\1)", "abcabcd", 0, 7);
+ x2("(a*)(.{3,}?)(?<!\\1)", "abcabcd", 0, 5);
+ x2("(?:(a.*b)|c.*d)(?<!(?(1))azzzb)", "azzzzb", 0, 6);
+ n("(?:(a.*b)|c.*d)(?<!(?(1))azzzb)", "azzzb");
+ x2("<(?<!NT{+}abcd)", "<(?<!NT{+}abcd)", 0, 1);
+ x2("(?<!a.*c)def", "abbbbdef", 5, 8);
+ n("(?<!a.*c)def", "abbbcdef");
+ x2("(?<!a.*X\\b)def", "abbbbbXdef", 7, 10);
+ n("(?<!a.*X\\B)def", "abbbbbXdef");
+ x2("(?<!a.*[uvw])def", "abbbbbXdef", 7, 10);
+ n("(?<!a.*[uvw])def", "abbbbbwdef");
+ x2("(?<!ab*\\S+)def", "abbbbb def", 9, 12);
+ x2("(?<!a.*\\S)def", "abbbbb def", 7, 10);
+ n("(?<!ab*\\s+)def", "abbbbb def");
+ x2("(?<!ab*\\s+\\B)def", "abbbbb def", 9, 12);
+ n("(?<!v|t|a+.*[efg])z", "abcdfz");
+ x2("(?<!v|t|a+.*[efg])z", "abcdfzavzuz", 10, 11);
+ n("(?<!v|t|^a+.*[efg])z", "abcdfz");
+ n("(?<!^(?:v|t|a+.*[efg]))z", "abcdfz");
+ x2("(?<!v|^t|^a+.*[efg])z", "uabcdfz", 6, 7);
x2("((?(a)\\g<1>|b))", "aab", 0, 3);
x2("((?(a)\\g<1>))", "aab", 0, 2);
x2("(b(?(a)|\\g<1>))", "bba", 0, 3);
e("(()(?(2)\\g<1>))", "", ONIGERR_NEVER_ENDING_RECURSION);
+ x2("(?(a)(?:b|c))", "ac", 0, 2);
+ n("^(?(a)b|c)", "ac");
+ x2("(?i)a|b", "B", 0, 1);
+ n("((?i)a|b.)|c", "C");
+ n("c(?i)a.|b.", "Caz");
+ x2("c(?i)a|b", "cB", 0, 2); /* == c(?i:a|b) */
+ x2("c(?i)a.|b.", "cBb", 0, 3);
x2("(?i)st", "st", 0, 2);
x2("(?i)st", "St", 0, 2);
@@ -1279,7 +1390,68 @@ extern int main(int argc, char* argv[])
x2("(?i)[ǰ]", "ǰ", 0, 2);
x2("(?i)[ǰ]", "j\xcc\x8c", 0, 3);
//x2("(?i)[j]\xcc\x8c", "ǰ", 0, 2);
+ x2("(?i)\ufb00a", "ffa", 0, 3);
+ x2("(?i)ffz", "\xef\xac\x80z", 0, 4);
+ x2("(?i)\u2126", "\xcf\x89", 0, 2);
+ x2("a(?i)\u2126", "a\xcf\x89", 0, 3);
+ x2("(?i)A\u2126", "a\xcf\x89", 0, 3);
+ x2("(?i)A\u2126=", "a\xcf\x89=", 0, 4);
+ x2("(?i:ss)=1234567890", "\xc5\xbf\xc5\xbf=1234567890", 0, 15);
+ x2("\\x{000A}", "\x0a", 0, 1);
+ x2("\\x{000A 002f}", "\x0a\x2f", 0, 2);
+ x2("\\x{000A 002f }", "\x0a\x2f", 0, 2);
+ x2("\\x{007C 001b}", "\x7c\x1b", 0, 2);
+ x2("\\x{1 2 3 4 5 6 7 8 9 a b c d e f}", "\x01\x02\x3\x04\x05\x06\x07\x08\x09\x0a\x0b\x0c\x0d\x0e\x0f", 0, 15);
+ x2("a\\x{000A 002f}@", "a\x0a\x2f@", 0, 4);
+ x2("a\\x{0060\n0063}@", "a\x60\x63@", 0, 4);
+ e("\\x{00000001 000000012}", "", ONIGERR_TOO_LONG_WIDE_CHAR_VALUE);
+ e("\\x{000A 00000002f}", "", ONIGERR_TOO_LONG_WIDE_CHAR_VALUE);
+ e("\\x{000A 002f/", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("\\x{000A 002f /", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("\\x{000A", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("\\x{000A ", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("\\x{000A 002f ", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ x2("\\o{102}", "B", 0, 1);
+ x2("\\o{102 103}", "BC", 0, 2);
+ x2("\\o{0160 0000161}", "pq", 0, 2);
+ x2("\\o{1 2 3 4 5 6 7 10 11 12 13 14 15 16 17}", "\x01\x02\x3\x04\x05\x06\x07\x08\x09\x0a\x0b\x0c\x0d\x0e\x0f", 0, 15);
+ x2("\\o{0007 0010 }", "\x07\x08", 0, 2);
+ e("\\o{0000 0015/", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("\\o{0000 0015 /", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("\\o{0015", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("\\o{0015 ", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("\\o{0007 002f}", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ x2("[\\x{000A}]", "\x0a", 0, 1);
+ x2("[\\x{000A 002f}]+", "\x0a\x2f\x2e", 0, 2);
+ x2("[\\x{01 0F 1A 2c 4B}]+", "\x20\x01\x0f\x1a\x2c\x4b\x1b", 1, 6);
+ x2("[\\x{0020 0024}-\\x{0026}]+", "\x25\x24\x26\x23", 0, 3);
+ x2("[\\x{0030}-\\x{0033 005a}]+", "\x30\x31\x32\x33\x5a\34", 0, 5);
+ e("[\\x{000A]", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("[\\x{000A ]", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("[\\x{000A }]", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ x2("[\\o{102}]", "B", 0, 1);
+ x2("[\\o{102 103}]*", "BC", 0, 2);
+ e("[a\\o{002 003]bcde|zzz", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ x2("[\\x{0030-0039}]+", "abc0123456789def", 3, 13);
+ x2("[\\x{0030 - 0039 }]+", "abc0123456789def", 3, 13);
+ x2("[\\x{0030 - 0039 0063 0064}]+", "abc0123456789def", 2, 14);
+ x2("[\\x{0030 - 0039 0063-0065}]+", "acde019b", 1, 7);
+ e("[\\x{0030 - 0039-0063 0064}]+", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("[\\x{0030 - }]+", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("[\\x{0030 -- 0040}]+", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("[\\x{0030--0040}]+", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("[\\x{0030 - - 0040}]+", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("[\\x{0030 0044 - }]+", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ e("[a-\\x{0070 - 0039}]+", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ x2("[a-\\x{0063 0071}]+", "dabcqz", 1, 5);
+ x2("[-\\x{0063-0065}]+", "ace-df", 1, 5);
+ x2("[\\x61-\\x{0063 0065}]+", "abced", 0, 4);
+ e("[\\x61-\\x{0063-0065}]+", "", ONIGERR_INVALID_CODE_POINT_VALUE);
+ x2("[t\\x{0063 0071}]+", "tcqb", 0, 3);
+ x2("[\\W\\x{0063 0071}]+", "*cqa", 0, 3);
+
+ n("a(b|)+d", "abbbbbbbbbbbbbbbbbbbbbbbbbbbbbbcd"); /* https://www.haijin-boys.com/discussions/5079 */
n(" \xfd", ""); /* https://bugs.php.net/bug.php?id=77370 */
/* can't use \xfc00.. because compiler error: hex escape sequence out of range */
n("()0\\xfc00000\\xfc00000\\xfc00000\xfc", ""); /* https://bugs.php.net/bug.php?id=77371 */
@@ -1299,8 +1471,14 @@ extern int main(int argc, char* argv[])
e("[\\x{7fffffff}]", "", ONIGERR_INVALID_CODE_POINT_VALUE);
e("\\u040", "@", ONIGERR_INVALID_CODE_POINT_VALUE);
e("(?<abc>\\g<abc>)", "zzzz", ONIGERR_NEVER_ENDING_RECURSION);
- e("(?<=(?>abc))", "abc", ONIGERR_INVALID_LOOK_BEHIND_PATTERN);
e("(*FOO)", "abcdefg", ONIGERR_UNDEFINED_CALLOUT_NAME);
+ e("*", "abc", ONIGERR_TARGET_OF_REPEAT_OPERATOR_NOT_SPECIFIED);
+ e("|*", "abc", ONIGERR_TARGET_OF_REPEAT_OPERATOR_NOT_SPECIFIED);
+ e("(?i)*", "abc", ONIGERR_TARGET_OF_REPEAT_OPERATOR_NOT_SPECIFIED);
+ e("(?:*)", "abc", ONIGERR_TARGET_OF_REPEAT_OPERATOR_NOT_SPECIFIED);
+ e("(?m:*)", "abc", ONIGERR_TARGET_OF_REPEAT_OPERATOR_NOT_SPECIFIED);
+ x2("(?:)*", "abc", 0, 0);
+ e("^*", "abc", ONIGERR_TARGET_OF_REPEAT_OPERATOR_INVALID);
fprintf(stdout,
"\nRESULT SUCC: %4d, FAIL: %d, ERROR: %d (by Oniguruma %s)\n",
diff --git a/test/testc.c b/test/testc.c
index 5c60764..fbede67 100644
--- a/test/testc.c
+++ b/test/testc.c
@@ -1,17 +1,12 @@
/*
* testc.c
- * Copyright (c) 2019 K.Kosako
+ * Copyright (c) 2019-2020 K.Kosako
*/
#include "config.h"
#include <stdio.h>
+#include <string.h>
-#ifdef POSIX_TEST
-#include "onigposix.h"
-#else
#include "oniguruma.h"
-#endif
-
-#include <string.h>
#define SLEN(s) strlen(s)
@@ -20,66 +15,11 @@ static int nfail = 0;
static int nerror = 0;
static FILE* err_file;
-
-#ifndef POSIX_TEST
static OnigRegion* region;
-#endif
static void xx(char* pattern, char* str, int from, int to, int mem, int not)
{
int r;
-
-#ifdef POSIX_TEST
- regex_t reg;
- char buf[200];
- regmatch_t pmatch[25];
-
- r = regcomp(&reg, pattern, REG_EXTENDED | REG_NEWLINE);
- if (r) {
- regerror(r, &reg, buf, sizeof(buf));
- fprintf(err_file, "ERROR: %s\n", buf);
- nerror++;
- return ;
- }
-
- r = regexec(&reg, str, reg.re_nsub + 1, pmatch, 0);
- if (r != 0 && r != REG_NOMATCH) {
- regerror(r, &reg, buf, sizeof(buf));
- fprintf(err_file, "ERROR: %s\n", buf);
- nerror++;
- return ;
- }
-
- if (r == REG_NOMATCH) {
- if (not) {
- fprintf(stdout, "OK(N): /%s/ '%s'\n", pattern, str);
- nsucc++;
- }
- else {
- fprintf(stdout, "FAIL: /%s/ '%s'\n", pattern, str);
- nfail++;
- }
- }
- else {
- if (not) {
- fprintf(stdout, "FAIL(N): /%s/ '%s'\n", pattern, str);
- nfail++;
- }
- else {
- if (pmatch[mem].rm_so == from && pmatch[mem].rm_eo == to) {
- fprintf(stdout, "OK: /%s/ '%s'\n", pattern, str);
- nsucc++;
- }
- else {
- fprintf(stdout, "FAIL: /%s/ '%s' %d-%d : %d-%d\n", pattern, str,
- from, to, pmatch[mem].rm_so, pmatch[mem].rm_eo);
- nfail++;
- }
- }
- }
- regfree(&reg);
-
-#else
regex_t* reg;
OnigErrorInfo einfo;
@@ -132,7 +72,6 @@ static void xx(char* pattern, char* str, int from, int to, int mem, int not)
}
}
onig_free(reg);
-#endif
}
static void x2(char* pattern, char* str, int from, int to)
@@ -152,20 +91,13 @@ static void n(char* pattern, char* str)
extern int main(int argc, char* argv[])
{
-#ifndef POSIX_TEST
OnigEncoding use_encs[1];
use_encs[0] = ONIG_ENCODING_EUC_JP;
onig_initialize(use_encs, sizeof(use_encs)/sizeof(use_encs[0]));
-#endif
err_file = stdout;
-
-#ifdef POSIX_TEST
- reg_set_encoding(REG_POSIX_ENCODING_EUC_JP);
-#else
region = onig_region_new();
-#endif
x2("", "", 0, 0);
x2("^", "", 0, 0);
@@ -961,19 +893,15 @@ extern int main(int argc, char* argv[])
x2(".<b>�С������Υ����������<\\/b>", "a<b>�С������Υ����������</b>", 0, 32);
x2("\\n?\\z", "����ˤ���", 10, 10);
-#ifndef POSIX_TEST
x2("\\p{Hiragana}", "��", 0, 2);
n("\\P{Hiragana}", "��");
-#endif
fprintf(stdout,
"\nRESULT SUCC: %4d, FAIL: %d, ERROR: %d (by Oniguruma %s)\n",
nsucc, nfail, nerror, onig_version());
-#ifndef POSIX_TEST
onig_region_free(region, 1);
onig_end();
-#endif
return ((nfail == 0 && nerror == 0) ? 0 : -1);
}
diff --git a/test/testp.c b/test/testp.c
new file mode 100644
index 0000000..b88d0e3
--- /dev/null
+++ b/test/testp.c
@@ -0,0 +1,614 @@
+/*
+ * testp.c
+ * Copyright (c) 2020 K.Kosako
+ */
+#include "config.h"
+#include <stdio.h>
+#include <string.h>
+
+#include "onigposix.h"
+
+#define SLEN(s) strlen(s)
+
+static int nsucc = 0;
+static int nfail = 0;
+static int nerror = 0;
+
+static FILE* err_file;
+
+static void
+xx(char* pattern, char* str, int from, int to, int mem, int not)
+{
+ int r;
+ regex_t reg;
+ char buf[200];
+ regmatch_t pmatch[25];
+
+ r = regcomp(&reg, pattern, REG_EXTENDED | REG_NEWLINE);
+ if (r) {
+ regerror(r, &reg, buf, sizeof(buf));
+ fprintf(err_file, "ERROR: %s\n", buf);
+ nerror++;
+ return ;
+ }
+
+ r = regexec(&reg, str, reg.re_nsub + 1, pmatch, 0);
+ if (r != 0 && r != REG_NOMATCH) {
+ regerror(r, &reg, buf, sizeof(buf));
+ fprintf(err_file, "ERROR: %s\n", buf);
+ nerror++;
+ return ;
+ }
+
+ if (r == REG_NOMATCH) {
+ if (not) {
+ fprintf(stdout, "OK(N): /%s/ '%s'\n", pattern, str);
+ nsucc++;
+ }
+ else {
+ fprintf(stdout, "FAIL: /%s/ '%s'\n", pattern, str);
+ nfail++;
+ }
+ }
+ else {
+ if (not) {
+ fprintf(stdout, "FAIL(N): /%s/ '%s'\n", pattern, str);
+ nfail++;
+ }
+ else {
+ if (pmatch[mem].rm_so == from && pmatch[mem].rm_eo == to) {
+ fprintf(stdout, "OK: /%s/ '%s'\n", pattern, str);
+ nsucc++;
+ }
+ else {
+ fprintf(stdout, "FAIL: /%s/ '%s' %d-%d : %d-%d\n", pattern, str,
+ from, to, pmatch[mem].rm_so, pmatch[mem].rm_eo);
+ nfail++;
+ }
+ }
+ }
+ regfree(&reg);
+}
+
+static void x2(char* pattern, char* str, int from, int to)
+{
+ xx(pattern, str, from, to, 0, 0);
+}
+
+static void x3(char* pattern, char* str, int from, int to, int mem)
+{
+ xx(pattern, str, from, to, mem, 0);
+}
+
+static void n(char* pattern, char* str)
+{
+ xx(pattern, str, 0, 0, 0, 1);
+}
+
+extern int main(int argc, char* argv[])
+{
+ err_file = stdout;
+
+ reg_set_encoding(REG_POSIX_ENCODING_UTF8);
+
+ x2("", "", 0, 0);
+ x2("^", "", 0, 0);
+ x2("$", "", 0, 0);
+ x2("\\G", "", 0, 0);
+ x2("\\A", "", 0, 0);
+ x2("\\Z", "", 0, 0);
+ x2("\\z", "", 0, 0);
+ x2("^$", "", 0, 0);
+ x2("\\ca", "\001", 0, 1);
+ x2("\\C-b", "\002", 0, 1);
+ x2("\\c\\\\", "\034", 0, 1);
+ x2("q[\\c\\\\]", "q\034", 0, 2);
+ x2("", "a", 0, 0);
+ x2("a", "a", 0, 1);
+ x2("\\x61", "a", 0, 1);
+ x2("aa", "aa", 0, 2);
+ x2("aaa", "aaa", 0, 3);
+ x2("aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa", "aaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaaa", 0, 35);
+ x2("ab", "ab", 0, 2);
+ x2("b", "ab", 1, 2);
+ x2("bc", "abc", 1, 3);
+ x2("(?i:#RET#)", "#INS##RET#", 5, 10);
+ x2("\\17", "\017", 0, 1);
+ x2("\\x1f", "\x1f", 0, 1);
+ x2("a(?#....\\\\JJJJ)b", "ab", 0, 2);
+ x2("(?x) G (o O(?-x)oO) g L", "GoOoOgLe", 0, 7);
+ x2(".", "a", 0, 1);
+ n(".", "");
+ x2("..", "ab", 0, 2);
+ x2("\\w", "e", 0, 1);
+ n("\\W", "e");
+ x2("\\s", " ", 0, 1);
+ x2("\\S", "b", 0, 1);
+ x2("\\d", "4", 0, 1);
+ n("\\D", "4");
+ x2("\\b", "z ", 0, 0);
+ x2("\\b", " z", 1, 1);
+ x2("\\B", "zz ", 1, 1);
+ x2("\\B", "z ", 2, 2);
+ x2("\\B", " z", 0, 0);
+ x2("[ab]", "b", 0, 1);
+ n("[ab]", "c");
+ x2("[a-z]", "t", 0, 1);
+ n("[^a]", "a");
+ x2("[^a]", "\n", 0, 1);
+ x2("[]]", "]", 0, 1);
+ n("[^]]", "]");
+ x2("[\\^]+", "0^^1", 1, 3);
+ x2("[b-]", "b", 0, 1);
+ x2("[b-]", "-", 0, 1);
+ x2("[\\w]", "z", 0, 1);
+ n("[\\w]", " ");
+ x2("[\\W]", "b$", 1, 2);
+ x2("[\\d]", "5", 0, 1);
+ n("[\\d]", "e");
+ x2("[\\D]", "t", 0, 1);
+ n("[\\D]", "3");
+ x2("[\\s]", " ", 0, 1);
+ n("[\\s]", "a");
+ x2("[\\S]", "b", 0, 1);
+ n("[\\S]", " ");
+ x2("[\\w\\d]", "2", 0, 1);
+ n("[\\w\\d]", " ");
+ x2("[[:upper:]]", "B", 0, 1);
+ x2("[*[:xdigit:]+]", "+", 0, 1);
+ x2("[*[:xdigit:]+]", "GHIKK-9+*", 6, 7);
+ x2("[*[:xdigit:]+]", "-@^+", 3, 4);
+ n("[[:upper]]", "A");
+ x2("[[:upper]]", ":", 0, 1);
+ x2("[\\044-\\047]", "\046", 0, 1);
+ x2("[\\x5a-\\x5c]", "\x5b", 0, 1);
+ x2("[\\x6A-\\x6D]", "\x6c", 0, 1);
+ n("[\\x6A-\\x6D]", "\x6E");
+ n("^[0-9A-F]+ 0+ UNDEF ", "75F 00000000 SECT14A notype () External | _rb_apply");
+ x2("[\\[]", "[", 0, 1);
+ x2("[\\]]", "]", 0, 1);
+ x2("[&]", "&", 0, 1);
+ x2("[[ab]]", "b", 0, 1);
+ x2("[[ab]c]", "c", 0, 1);
+ n("[[^a]]", "a");
+ n("[^[a]]", "a");
+ x2("[[ab]&&bc]", "b", 0, 1);
+ n("[[ab]&&bc]", "a");
+ n("[[ab]&&bc]", "c");
+ x2("[a-z&&b-y&&c-x]", "w", 0, 1);
+ n("[^a-z&&b-y&&c-x]", "w");
+ x2("[[^a&&a]&&a-z]", "b", 0, 1);
+ n("[[^a&&a]&&a-z]", "a");
+ x2("[[^a-z&&bcdef]&&[^c-g]]", "h", 0, 1);
+ n("[[^a-z&&bcdef]&&[^c-g]]", "c");
+ x2("[^[^abc]&&[^cde]]", "c", 0, 1);
+ x2("[^[^abc]&&[^cde]]", "e", 0, 1);
+ n("[^[^abc]&&[^cde]]", "f");
+ x2("[a-&&-a]", "-", 0, 1);
+ n("[a\\-&&\\-a]", "&");
+ n("\\wabc", " abc");
+ x2("a\\Wbc", "a bc", 0, 4);
+ x2("a.b.c", "aabbc", 0, 5);
+ x2(".\\wb\\W..c", "abb bcc", 0, 7);
+ x2("\\s\\wzzz", " zzzz", 0, 5);
+ x2("aa.b", "aabb", 0, 4);
+ n(".a", "ab");
+ x2(".a", "aa", 0, 2);
+ x2("^a", "a", 0, 1);
+ x2("^a$", "a", 0, 1);
+ x2("^\\w$", "a", 0, 1);
+ n("^\\w$", " ");
+ x2("^\\wab$", "zab", 0, 3);
+ x2("^\\wabcdef$", "zabcdef", 0, 7);
+ x2("^\\w...def$", "zabcdef", 0, 7);
+ x2("\\w\\w\\s\\Waaa\\d", "aa aaa4", 0, 8);
+ x2("\\A\\Z", "", 0, 0);
+ x2("\\Axyz", "xyz", 0, 3);
+ x2("xyz\\Z", "xyz", 0, 3);
+ x2("xyz\\z", "xyz", 0, 3);
+ x2("a\\Z", "a", 0, 1);
+ x2("\\Gaz", "az", 0, 2);
+ n("\\Gz", "bza");
+ n("az\\G", "az");
+ n("az\\A", "az");
+ n("a\\Az", "az");
+ x2("\\^\\$", "^$", 0, 2);
+ x2("^x?y", "xy", 0, 2);
+ x2("^(x?y)", "xy", 0, 2);
+ x2("\\w", "_", 0, 1);
+ n("\\W", "_");
+ x2("(?=z)z", "z", 0, 1);
+ n("(?=z).", "a");
+ x2("(?!z)a", "a", 0, 1);
+ n("(?!z)a", "z");
+ x2("(?i:a)", "a", 0, 1);
+ x2("(?i:a)", "A", 0, 1);
+ x2("(?i:A)", "a", 0, 1);
+ n("(?i:A)", "b");
+ x2("(?i:[A-Z])", "a", 0, 1);
+ x2("(?i:[f-m])", "H", 0, 1);
+ x2("(?i:[f-m])", "h", 0, 1);
+ n("(?i:[f-m])", "e");
+ x2("(?i:[A-c])", "D", 0, 1);
+ n("(?i:[^a-z])", "A");
+ n("(?i:[^a-z])", "a");
+ x2("(?i:[!-k])", "Z", 0, 1);
+ x2("(?i:[!-k])", "7", 0, 1);
+ x2("(?i:[T-}])", "b", 0, 1);
+ x2("(?i:[T-}])", "{", 0, 1);
+ x2("(?i:\\?a)", "?A", 0, 2);
+ x2("(?i:\\*A)", "*a", 0, 2);
+ n(".", "\n");
+ x2("(?m:.)", "\n", 0, 1);
+ x2("(?m:a.)", "a\n", 0, 2);
+ x2("(?m:.b)", "a\nb", 1, 3);
+ x2(".*abc", "dddabdd\nddabc", 8, 13);
+ x2("(?m:.*abc)", "dddabddabc", 0, 10);
+ n("(?i)(?-i)a", "A");
+ n("(?i)(?-i:a)", "A");
+ x2("a?", "", 0, 0);
+ x2("a?", "b", 0, 0);
+ x2("a?", "a", 0, 1);
+ x2("a*", "", 0, 0);
+ x2("a*", "a", 0, 1);
+ x2("a*", "aaa", 0, 3);
+ x2("a*", "baaaa", 0, 0);
+ n("a+", "");
+ x2("a+", "a", 0, 1);
+ x2("a+", "aaaa", 0, 4);
+ x2("a+", "aabbb", 0, 2);
+ x2("a+", "baaaa", 1, 5);
+ x2(".?", "", 0, 0);
+ x2(".?", "f", 0, 1);
+ x2(".?", "\n", 0, 0);
+ x2(".*", "", 0, 0);
+ x2(".*", "abcde", 0, 5);
+ x2(".+", "z", 0, 1);
+ x2(".+", "zdswer\n", 0, 6);
+ x2("(.*)a\\1f", "babfbac", 0, 4);
+ x2("(.*)a\\1f", "bacbabf", 3, 7);
+ x2("((.*)a\\2f)", "bacbabf", 3, 7);
+ x2("(.*)a\\1f", "baczzzzzz\nbazz\nzzzzbabf", 19, 23);
+ x2("a|b", "a", 0, 1);
+ x2("a|b", "b", 0, 1);
+ x2("|a", "a", 0, 0);
+ x2("(|a)", "a", 0, 0);
+ x2("ab|bc", "ab", 0, 2);
+ x2("ab|bc", "bc", 0, 2);
+ x2("z(?:ab|bc)", "zbc", 0, 3);
+ x2("a(?:ab|bc)c", "aabc", 0, 4);
+ x2("ab|(?:ac|az)", "az", 0, 2);
+ x2("a|b|c", "dc", 1, 2);
+ x2("a|b|cd|efg|h|ijk|lmn|o|pq|rstuvwx|yz", "pqr", 0, 2);
+ n("a|b|cd|efg|h|ijk|lmn|o|pq|rstuvwx|yz", "mn");
+ x2("a|^z", "ba", 1, 2);
+ x2("a|^z", "za", 0, 1);
+ x2("a|\\Gz", "bza", 2, 3);
+ x2("a|\\Gz", "za", 0, 1);
+ x2("a|\\Az", "bza", 2, 3);
+ x2("a|\\Az", "za", 0, 1);
+ x2("a|b\\Z", "ba", 1, 2);
+ x2("a|b\\Z", "b", 0, 1);
+ x2("a|b\\z", "ba", 1, 2);
+ x2("a|b\\z", "b", 0, 1);
+ x2("\\w|\\s", " ", 0, 1);
+ n("\\w|\\w", " ");
+ x2("\\w|%", "%", 0, 1);
+ x2("\\w|[&$]", "&", 0, 1);
+ x2("[b-d]|[^e-z]", "a", 0, 1);
+ x2("(?:a|[c-f])|bz", "dz", 0, 1);
+ x2("(?:a|[c-f])|bz", "bz", 0, 2);
+ x2("abc|(?=zz)..f", "zzf", 0, 3);
+ x2("abc|(?!zz)..f", "abf", 0, 3);
+ x2("(?=za)..a|(?=zz)..a", "zza", 0, 3);
+ n("(?>a|abd)c", "abdc");
+ x2("(?>abd|a)c", "abdc", 0, 4);
+ x2("a?|b", "a", 0, 1);
+ x2("a?|b", "b", 0, 0);
+ x2("a?|b", "", 0, 0);
+ x2("a*|b", "aa", 0, 2);
+ x2("a*|b*", "ba", 0, 0);
+ x2("a*|b*", "ab", 0, 1);
+ x2("a+|b*", "", 0, 0);
+ x2("a+|b*", "bbb", 0, 3);
+ x2("a+|b*", "abbb", 0, 1);
+ n("a+|b+", "");
+ x2("(a|b)?", "b", 0, 1);
+ x2("(a|b)*", "ba", 0, 2);
+ x2("(a|b)+", "bab", 0, 3);
+ x2("(ab|ca)+", "caabbc", 0, 4);
+ x2("(ab|ca)+", "aabca", 1, 5);
+ x2("(ab|ca)+", "abzca", 0, 2);
+ x2("(a|bab)+", "ababa", 0, 5);
+ x2("(a|bab)+", "ba", 1, 2);
+ x2("(a|bab)+", "baaaba", 1, 4);
+ x2("(?:a|b)(?:a|b)", "ab", 0, 2);
+ x2("(?:a*|b*)(?:a*|b*)", "aaabbb", 0, 3);
+ x2("(?:a*|b*)(?:a+|b+)", "aaabbb", 0, 6);
+ x2("(?:a+|b+){2}", "aaabbb", 0, 6);
+ x2("h{0,}", "hhhh", 0, 4);
+ x2("(?:a+|b+){1,2}", "aaabbb", 0, 6);
+ n("ax{2}*a", "0axxxa1");
+ n("a.{0,2}a", "0aXXXa0");
+ n("a.{0,2}?a", "0aXXXa0");
+ n("a.{0,2}?a", "0aXXXXa0");
+ x2("^a{2,}?a$", "aaa", 0, 3);
+ x2("^[a-z]{2,}?$", "aaa", 0, 3);
+ x2("(?:a+|\\Ab*)cc", "cc", 0, 2);
+ n("(?:a+|\\Ab*)cc", "abcc");
+ x2("(?:^a+|b+)*c", "aabbbabc", 6, 8);
+ x2("(?:^a+|b+)*c", "aabbbbc", 0, 7);
+ x2("a|(?i)c", "C", 0, 1);
+ x2("(?i)c|a", "C", 0, 1);
+ x2("(?i)c|a", "A", 0, 1);
+ x2("(?i:c)|a", "C", 0, 1);
+ n("(?i:c)|a", "A");
+ x2("[abc]?", "abc", 0, 1);
+ x2("[abc]*", "abc", 0, 3);
+ x2("[^abc]*", "abc", 0, 0);
+ n("[^abc]+", "abc");
+ x2("a?\?", "aaa", 0, 0);
+ x2("ba?\?b", "bab", 0, 3);
+ x2("a*?", "aaa", 0, 0);
+ x2("ba*?", "baa", 0, 1);
+ x2("ba*?b", "baab", 0, 4);
+ x2("a+?", "aaa", 0, 1);
+ x2("ba+?", "baa", 0, 2);
+ x2("ba+?b", "baab", 0, 4);
+ x2("(?:a?)?\?", "a", 0, 0);
+ x2("(?:a?\?)?", "a", 0, 0);
+ x2("(?:a?)+?", "aaa", 0, 1);
+ x2("(?:a+)?\?", "aaa", 0, 0);
+ x2("(?:a+)?\?b", "aaab", 0, 4);
+ x2("(?:ab)?{2}", "", 0, 0);
+ x2("(?:ab)?{2}", "ababa", 0, 4);
+ x2("(?:ab)*{0}", "ababa", 0, 0);
+ x2("(?:ab){3,}", "abababab", 0, 8);
+ n("(?:ab){3,}", "abab");
+ x2("(?:ab){2,4}", "ababab", 0, 6);
+ x2("(?:ab){2,4}", "ababababab", 0, 8);
+ x2("(?:ab){2,4}?", "ababababab", 0, 4);
+ x2("(?:ab){,}", "ab{,}", 0, 5);
+ x2("(?:abc)+?{2}", "abcabcabc", 0, 6);
+ x2("(?:X*)(?i:xa)", "XXXa", 0, 4);
+ x2("(d+)([^abc]z)", "dddz", 0, 4);
+ x2("([^abc]*)([^abc]z)", "dddz", 0, 4);
+ x2("(\\w+)(\\wz)", "dddz", 0, 4);
+ x3("(a)", "a", 0, 1, 1);
+ x3("(ab)", "ab", 0, 2, 1);
+ x2("((ab))", "ab", 0, 2);
+ x3("((ab))", "ab", 0, 2, 1);
+ x3("((ab))", "ab", 0, 2, 2);
+ x3("((((((((((((((((((((ab))))))))))))))))))))", "ab", 0, 2, 20);
+ x3("(ab)(cd)", "abcd", 0, 2, 1);
+ x3("(ab)(cd)", "abcd", 2, 4, 2);
+ x3("()(a)bc(def)ghijk", "abcdefghijk", 3, 6, 3);
+ x3("(()(a)bc(def)ghijk)", "abcdefghijk", 3, 6, 4);
+ x2("(^a)", "a", 0, 1);
+ x3("(a)|(a)", "ba", 1, 2, 1);
+ x3("(^a)|(a)", "ba", 1, 2, 2);
+ x3("(a?)", "aaa", 0, 1, 1);
+ x3("(a*)", "aaa", 0, 3, 1);
+ x3("(a*)", "", 0, 0, 1);
+ x3("(a+)", "aaaaaaa", 0, 7, 1);
+ x3("(a+|b*)", "bbbaa", 0, 3, 1);
+ x3("(a+|b?)", "bbbaa", 0, 1, 1);
+ x3("(abc)?", "abc", 0, 3, 1);
+ x3("(abc)*", "abc", 0, 3, 1);
+ x3("(abc)+", "abc", 0, 3, 1);
+ x3("(xyz|abc)+", "abc", 0, 3, 1);
+ x3("([xyz][abc]|abc)+", "abc", 0, 3, 1);
+ x3("((?i:abc))", "AbC", 0, 3, 1);
+ x2("(abc)(?i:\\1)", "abcABC", 0, 6);
+ x3("((?m:a.c))", "a\nc", 0, 3, 1);
+ x3("((?=az)a)", "azb", 0, 1, 1);
+ x3("abc|(.abd)", "zabd", 0, 4, 1);
+ x2("(?:abc)|(ABC)", "abc", 0, 3);
+ x3("(?i:(abc))|(zzz)", "ABC", 0, 3, 1);
+ x3("a*(.)", "aaaaz", 4, 5, 1);
+ x3("a*?(.)", "aaaaz", 0, 1, 1);
+ x3("a*?(c)", "aaaac", 4, 5, 1);
+ x3("[bcd]a*(.)", "caaaaz", 5, 6, 1);
+ x3("(\\Abb)cc", "bbcc", 0, 2, 1);
+ n("(\\Abb)cc", "zbbcc");
+ x3("(^bb)cc", "bbcc", 0, 2, 1);
+ n("(^bb)cc", "zbbcc");
+ x3("cc(bb$)", "ccbb", 2, 4, 1);
+ n("cc(bb$)", "ccbbb");
+ n("(\\1)", "");
+ n("\\1(a)", "aa");
+ n("(a(b)\\1)\\2+", "ababb");
+ n("(?:(?:\\1|z)(a))+$", "zaa");
+ x2("(?:(?:\\1|z)(a))+$", "zaaa", 0, 4);
+ x2("(a)(?=\\1)", "aa", 0, 1);
+ n("(a)$|\\1", "az");
+ x2("(a)\\1", "aa", 0, 2);
+ n("(a)\\1", "ab");
+ x2("(a?)\\1", "aa", 0, 2);
+ x2("(a?\?)\\1", "aa", 0, 0);
+ x2("(a*)\\1", "aaaaa", 0, 4);
+ x3("(a*)\\1", "aaaaa", 0, 2, 1);
+ x2("a(b*)\\1", "abbbb", 0, 5);
+ x2("a(b*)\\1", "ab", 0, 1);
+ x2("(a*)(b*)\\1\\2", "aaabbaaabb", 0, 10);
+ x2("(a*)(b*)\\2", "aaabbbb", 0, 7);
+ x2("(((((((a*)b))))))c\\7", "aaabcaaa", 0, 8);
+ x3("(((((((a*)b))))))c\\7", "aaabcaaa", 0, 3, 7);
+ x2("(a)(b)(c)\\2\\1\\3", "abcbac", 0, 6);
+ x2("([a-d])\\1", "cc", 0, 2);
+ x2("(\\w\\d\\s)\\1", "f5 f5 ", 0, 6);
+ n("(\\w\\d\\s)\\1", "f5 f5");
+ x2("(who|[a-c]{3})\\1", "whowho", 0, 6);
+ x2("...(who|[a-c]{3})\\1", "abcwhowho", 0, 9);
+ x2("(who|[a-c]{3})\\1", "cbccbc", 0, 6);
+ x2("(^a)\\1", "aa", 0, 2);
+ n("(^a)\\1", "baa");
+ n("(a$)\\1", "aa");
+ n("(ab\\Z)\\1", "ab");
+ x2("(a*\\Z)\\1", "a", 1, 1);
+ x2(".(a*\\Z)\\1", "ba", 1, 2);
+ x3("(.(abc)\\2)", "zabcabc", 0, 7, 1);
+ x3("(.(..\\d.)\\2)", "z12341234", 0, 9, 1);
+ x2("((?i:az))\\1", "AzAz", 0, 4);
+ n("((?i:az))\\1", "Azaz");
+ x2("(?<=a)b", "ab", 1, 2);
+ n("(?<=a)b", "bb");
+ x2("(?<=a|b)b", "bb", 1, 2);
+ x2("(?<=a|bc)b", "bcb", 2, 3);
+ x2("(?<=a|bc)b", "ab", 1, 2);
+ x2("(?<=a|bc||defghij|klmnopq|r)z", "rz", 1, 2);
+ x2("(a)\\g<1>", "aa", 0, 2);
+ x2("(?<!a)b", "cb", 1, 2);
+ n("(?<!a)b", "ab");
+ x2("(?<!a|bc)b", "bbb", 0, 1);
+ n("(?<!a|bc)z", "bcz");
+ x2("(?<name1>a)", "a", 0, 1);
+ x2("(?<name_2>ab)\\g<name_2>", "abab", 0, 4);
+ x2("(?<name_3>.zv.)\\k<name_3>", "azvbazvb", 0, 8);
+ x2("(?<=\\g<ab>)|-\\zEND (?<ab>XyZ)", "XyZ", 3, 3);
+ x2("(?<n>|a\\g<n>)+", "", 0, 0);
+ x2("(?<n>|\\(\\g<n>\\))+$", "()(())", 0, 6);
+ x3("\\g<n>(?<n>.){0}", "X", 0, 1, 1);
+ x2("\\g<n>(abc|df(?<n>.YZ){2,8}){0}", "XYZ", 0, 3);
+ x2("\\A(?<n>(a\\g<n>)|)\\z", "aaaa", 0, 4);
+ x2("(?<n>|\\g<m>\\g<n>)\\z|\\zEND (?<m>a|(b)\\g<m>)", "bbbbabba", 0, 8);
+ x2("(?<name1240>\\w+\\sx)a+\\k<name1240>", " fg xaaaaaaaafg x", 2, 18);
+ x3("(z)()()(?<_9>a)\\g<_9>", "zaa", 2, 3, 1);
+ x2("(.)(((?<_>a)))\\k<_>", "zaa", 0, 3);
+ x2("((?<name1>\\d)|(?<name2>\\w))(\\k<name1>|\\k<name2>)", "ff", 0, 2);
+ x2("(?:(?<x>)|(?<x>efg))\\k<x>", "", 0, 0);
+ x2("(?:(?<x>abc)|(?<x>efg))\\k<x>", "abcefgefg", 3, 9);
+ n("(?:(?<x>abc)|(?<x>efg))\\k<x>", "abcefg");
+ x2("(?:(?<n1>.)|(?<n1>..)|(?<n1>...)|(?<n1>....)|(?<n1>.....)|(?<n1>......)|(?<n1>.......)|(?<n1>........)|(?<n1>.........)|(?<n1>..........)|(?<n1>...........)|(?<n1>............)|(?<n1>.............)|(?<n1>..............))\\k<n1>$", "a-pyumpyum", 2, 10);
+ x3("(?:(?<n1>.)|(?<n1>..)|(?<n1>...)|(?<n1>....)|(?<n1>.....)|(?<n1>......)|(?<n1>.......)|(?<n1>........)|(?<n1>.........)|(?<n1>..........)|(?<n1>...........)|(?<n1>............)|(?<n1>.............)|(?<n1>..............))\\k<n1>$", "xxxxabcdefghijklmnabcdefghijklmn", 4, 18, 14);
+ x3("(?<name1>)(?<name2>)(?<name3>)(?<name4>)(?<name5>)(?<name6>)(?<name7>)(?<name8>)(?<name9>)(?<name10>)(?<name11>)(?<name12>)(?<name13>)(?<name14>)(?<name15>)(?<name16>aaa)(?<name17>)$", "aaa", 0, 3, 16);
+ x2("(?<foo>a|\\(\\g<foo>\\))", "a", 0, 1);
+ x2("(?<foo>a|\\(\\g<foo>\\))", "((((((a))))))", 0, 13);
+ x3("(?<foo>a|\\(\\g<foo>\\))", "((((((((a))))))))", 0, 17, 1);
+ x2("\\g<bar>|\\zEND(?<bar>.*abc$)", "abcxxxabc", 0, 9);
+ x2("\\g<1>|\\zEND(.a.)", "bac", 0, 3);
+ x3("\\g<_A>\\g<_A>|\\zEND(.a.)(?<_A>.b.)", "xbxyby", 3, 6, 1);
+ x2("\\A(?:\\g<pon>|\\g<pan>|\\zEND (?<pan>a|c\\g<pon>c)(?<pon>b|d\\g<pan>d))$", "cdcbcdc", 0, 7);
+ x2("\\A(?<n>|a\\g<m>)\\z|\\zEND (?<m>\\g<n>)", "aaaa", 0, 4);
+ x2("(?<n>(a|b\\g<n>c){3,5})", "baaaaca", 1, 5);
+ x2("(?<n>(a|b\\g<n>c){3,5})", "baaaacaaaaa", 0, 10);
+ x2("(?<pare>\\(([^\\(\\)]++|\\g<pare>)*+\\))", "((a))", 0, 5);
+ x2("()*\\1", "", 0, 0);
+ x2("(?:()|())*\\1\\2", "", 0, 0);
+ x3("(?:\\1a|())*", "a", 0, 0, 1);
+ x2("x((.)*)*x", "0x1x2x3", 1, 6);
+ x2("x((.)*)*x(?i:\\1)\\Z", "0x1x2x1X2", 1, 9);
+ x2("(?:()|()|()|()|()|())*\\2\\5", "", 0, 0);
+ x2("(?:()|()|()|(x)|()|())*\\2b\\5", "b", 0, 1);
+ x2("[0-9-a]", "-", 0, 1); // PR#44
+ n("[0-9-a]", ":"); // PR#44
+ x3("(\\(((?:[^(]|\\g<1>)*)\\))", "(abc)(abc)", 1, 4, 2); // PR#43
+ x2("\\o{101}", "A", 0, 1);
+ x2("(?:\\k'+1'B|(A)C)*", "ACAB", 0, 4); // relative backref by postitive number
+ x2("\\g<+2>(abc)(ABC){0}", "ABCabc", 0, 6); // relative call by positive number
+ x2("A\\g'0'|B()", "AAAAB", 0, 5);
+ x3("(A\\g'0')|B", "AAAAB", 0, 5, 1);
+ x2("(a*)(?(1))aa", "aaaaa", 0, 5);
+ x2("(a*)(?(-1))aa", "aaaaa", 0, 5);
+ x2("(?<name>aaa)(?('name'))aa", "aaaaa", 0, 5);
+ x2("(a)(?(1)aa|bb)a", "aaaaa", 0, 4);
+ x2("(?:aa|())(?(<1>)aa|bb)a", "aabba", 0, 5);
+ x2("(?:aa|())(?('1')aa|bb|cc)a", "aacca", 0, 5);
+ x3("(a*)(?(1)aa|a)b", "aaab", 0, 1, 1);
+ n("(a)(?(1)a|b)c", "abc");
+ x2("(a)(?(1)|)c", "ac", 0, 2);
+ n("(?()aaa|bbb)", "bbb");
+ x2("(a)(?(1+0)b|c)d", "abd", 0, 3);
+ x2("(?:(?'name'a)|(?'name'b))(?('name')c|d)e", "ace", 0, 3);
+ x2("(?:(?'name'a)|(?'name'b))(?('name')c|d)e", "bce", 0, 3);
+ x2("\\R", "\r\n", 0, 2);
+ x2("\\R", "\r", 0, 1);
+ x2("\\R", "\n", 0, 1);
+ x2("\\R", "\x0b", 0, 1);
+ n("\\R\\n", "\r\n");
+ x2("\\N", "a", 0, 1);
+ n("\\N", "\n");
+ n("(?m:\\N)", "\n");
+ n("(?-m:\\N)", "\n");
+ x2("\\O", "a", 0, 1);
+ x2("\\O", "\n", 0, 1);
+ x2("(?m:\\O)", "\n", 0, 1);
+ x2("(?-m:\\O)", "\n", 0, 1);
+ x2("\\K", "a", 0, 0);
+ x2("a\\K", "a", 1, 1);
+ x2("a\\Kb", "ab", 1, 2);
+ x2("(a\\Kb|ac\\Kd)", "acd", 2, 3);
+ x2("(a\\Kb|\\Kac\\K)*", "acababacab", 9, 10);
+
+ x2("(?~)", "", 0, 0);
+ x2("(?~)", "A", 0, 0);
+ x2("aaaaa(?~)", "aaaaaaaaaa", 0, 5);
+ x2("(?~(?:|aaa))", "aaa", 0, 0);
+ x2("(?~aaa|)", "aaa", 0, 0);
+ x2("a(?~(?~)).", "abcdefghijklmnopqrstuvwxyz", 0, 26); // !!!
+ x2("/\\*(?~\\*/)\\*/", "/* */ */", 0, 5);
+ x2("(?~\\w+)zzzzz", "zzzzz", 0, 5);
+ x2("(?~\\w*)zzzzz", "zzzzz", 0, 5);
+ x2("(?~A.C|B)", "ABC", 0, 0);
+ x2("(?~XYZ|ABC)a", "ABCa", 1, 4);
+ x2("(?~XYZ|ABC)a", "aABCa", 0, 1);
+ x2("<[^>]*>(?~[<>])</[^>]*>", "<a>vvv</a> <b> </b>", 0, 10);
+ x2("(?~ab)", "ccc\ndab", 0, 5);
+ x2("(?m:(?~ab))", "ccc\ndab", 0, 5);
+ x2("(?-m:(?~ab))", "ccc\ndab", 0, 5);
+ x2("(?~abc)xyz", "xyz012345678901234567890123456789abc", 0, 3);
+
+ // absent with expr
+ x2("(?~|78|\\d*)", "123456789", 0, 6);
+ x2("(?~|def|(?:abc|de|f){0,100})", "abcdedeabcfdefabc", 0, 11);
+ x2("(?~|ab|.*)", "ccc\nddd", 0, 3);
+ x2("(?~|ab|\\O*)", "ccc\ndab", 0, 5);
+ x2("(?~|ab|\\O{2,10})", "ccc\ndab", 0, 5);
+ x2("(?~|ab|\\O{1,10})", "ab", 1, 2);
+ n("(?~|ab|\\O{2,10})", "ab");
+ x2("(?~|abc|\\O{1,10})", "abc", 1, 3);
+ x2("(?~|ab|\\O{5,10})|abc", "abc", 0, 3);
+ x2("(?~|ab|\\O{1,10})", "cccccccccccab", 0, 10);
+ x2("(?~|aaa|)", "aaa", 0, 0);
+ x2("(?~||a*)", "aaaaaa", 0, 0);
+ x2("(?~||a*?)", "aaaaaa", 0, 0);
+ x2("(a)(?~|b|\\1)", "aaaaaa", 0, 2);
+ x2("(a)(?~|bb|(?:a\\1)*)", "aaaaaa", 0, 5);
+ x2("(b|c)(?~|abac|(?:a\\1)*)", "abababacabab", 1, 4);
+ n("(?~|c|a*+)a", "aaaaa");
+ x2("(?~|aaaaa|a*+)", "aaaaa", 0, 0);
+ x2("(?~|aaaaaa|a*+)b", "aaaaaab", 1, 7);
+ x2("(?~|abcd|(?>))", "zzzabcd", 0, 0);
+ x2("(?~|abc|a*?)", "aaaabc", 0, 0);
+
+ // absent stopper
+ x2("(?~|abc)a*", "aaaaaabc", 0, 5);
+ x2("(?~|abc)a*z|aaaaaabc", "aaaaaabc", 0, 8);
+ x2("(?~|aaaaaa)a*", "aaaaaa", 0, 0);
+ x2("(?~|abc)aaaa|aaaabc", "aaaabc", 0, 6);
+ x2("(?>(?~|abc))aaaa|aaaabc", "aaaabc", 0, 6);
+ x2("(?~|)a", "a", 0, 1);
+ n("(?~|a)a", "a");
+ x2("(?~|a)(?~|)a", "a", 0, 1);
+ x2("(?~|a).*(?~|)a", "bbbbbbbbbbbbbbbbbbbba", 0, 21);
+ x2("(?~|abc).*(xyz|pqr)(?~|)abc", "aaaaxyzaaapqrabc", 0, 16);
+ x2("(?~|abc).*(xyz|pqr)(?~|)abc", "aaaaxyzaaaabcpqrabc", 11, 19);
+ n("\\A(?~|abc).*(xyz|pqrabc)(?~|)abc", "aaaaxyzaaaabcpqrabcabc");
+ x2("(?~|a)(?~|)c|ab|a|", "ab", 0, 2);
+ x2("(?~|a)((?~|)c|ab|a|)", "ab", 0, 0);
+ x2("(?~|a)((?>(?~|))c|ab|a|)", "ab", 0, 0);
+
+ // extended grapheme cluster
+ // CR + LF
+ n(".\\y\\O", "\x0d\x0a");
+ x2(".\\Y\\O", "\x0d\x0a", 0, 2);
+ n("\\X\\X", "\x0d\x0a");
+ x2("^\\X$", "\x0d\x0a", 0, 2);
+ x2("^\\X\\X\\X$", "ab\x0d\x0a", 0, 4);
+
+ fprintf(stdout,
+ "\nRESULT SUCC: %4d, FAIL: %d, ERROR: %d (by Oniguruma %s)\n",
+ nsucc, nfail, nerror, onig_version());
+
+ return ((nfail == 0 && nerror == 0) ? 0 : -1);
+}