summaryrefslogtreecommitdiff
path: root/test/test_syntax.c
diff options
context:
space:
mode:
authorJörg Frings-Fürst <debian@jff.email>2020-04-20 20:33:58 +0200
committerJörg Frings-Fürst <debian@jff.email>2020-04-20 20:33:58 +0200
commit73c6133c32cddae59813cbadf655cb50a3a7356a (patch)
tree0935fb6da7f1d9728b42ddf08395a0e977e1c228 /test/test_syntax.c
parent043fff5b6f2461aeccb1c62cb771826cfe301832 (diff)
parent6b986090d954dbac91bbb3c43ce7c3328c91a780 (diff)
Update upstream source from tag 'upstream/6.9.5'
Update to upstream version '6.9.5' with Debian dir 1312d9badb7f1c47d032cf09765074e8fd80c991
Diffstat (limited to 'test/test_syntax.c')
-rw-r--r--test/test_syntax.c246
1 files changed, 246 insertions, 0 deletions
diff --git a/test/test_syntax.c b/test/test_syntax.c
new file mode 100644
index 0000000..df80e59
--- /dev/null
+++ b/test/test_syntax.c
@@ -0,0 +1,246 @@
+/*
+ * test_syntax.c
+ * Copyright (c) 2019-2020 K.Kosako
+ */
+#include "config.h"
+#ifdef ONIG_ESCAPE_UCHAR_COLLISION
+#undef ONIG_ESCAPE_UCHAR_COLLISION
+#endif
+
+#include <stdio.h>
+#include <string.h>
+#include "oniguruma.h"
+
+#define SLEN(s) strlen(s)
+
+static int nsucc = 0;
+static int nfail = 0;
+static int nerror = 0;
+
+static FILE* err_file;
+
+static OnigRegion* region;
+
+static OnigSyntaxType* Syntax;
+
+static void xx(char* pattern, char* str, int from, int to, int mem, int not,
+ int error_no)
+{
+ int r;
+ regex_t* reg;
+ OnigErrorInfo einfo;
+
+ r = onig_new(&reg, (UChar* )pattern, (UChar* )(pattern + SLEN(pattern)),
+ ONIG_OPTION_DEFAULT, ONIG_ENCODING_UTF8, Syntax, &einfo);
+ if (r) {
+ char s[ONIG_MAX_ERROR_MESSAGE_LEN];
+
+ if (error_no == 0) {
+ onig_error_code_to_str((UChar* )s, r, &einfo);
+ fprintf(err_file, "ERROR: %s /%s/\n", s, pattern);
+ nerror++;
+ }
+ else {
+ if (r == error_no) {
+ fprintf(stdout, "OK(ERROR): /%s/ %d\n", pattern, r);
+ nsucc++;
+ }
+ else {
+ fprintf(stdout, "FAIL(ERROR): /%s/ '%s', %d, %d\n", pattern, str,
+ error_no, r);
+ nfail++;
+ }
+ }
+
+ return ;
+ }
+
+ r = onig_search(reg, (UChar* )str, (UChar* )(str + SLEN(str)),
+ (UChar* )str, (UChar* )(str + SLEN(str)),
+ region, ONIG_OPTION_NONE);
+ if (r < ONIG_MISMATCH) {
+ char s[ONIG_MAX_ERROR_MESSAGE_LEN];
+
+ if (error_no == 0) {
+ onig_error_code_to_str((UChar* )s, r);
+ fprintf(err_file, "ERROR: %s /%s/\n", s, pattern);
+ nerror++;
+ }
+ else {
+ if (r == error_no) {
+ fprintf(stdout, "OK(ERROR): /%s/ '%s', %d\n", pattern, str, r);
+ nsucc++;
+ }
+ else {
+ fprintf(stdout, "FAIL ERROR NO: /%s/ '%s', %d, %d\n", pattern, str,
+ error_no, r);
+ nfail++;
+ }
+ }
+
+ return ;
+ }
+
+ if (r == ONIG_MISMATCH) {
+ if (not) {
+ fprintf(stdout, "OK(N): /%s/ '%s'\n", pattern, str);
+ nsucc++;
+ }
+ else {
+ fprintf(stdout, "FAIL: /%s/ '%s'\n", pattern, str);
+ nfail++;
+ }
+ }
+ else {
+ if (not) {
+ fprintf(stdout, "FAIL(N): /%s/ '%s'\n", pattern, str);
+ nfail++;
+ }
+ else {
+ if (region->beg[mem] == from && region->end[mem] == to) {
+ fprintf(stdout, "OK: /%s/ '%s'\n", pattern, str);
+ nsucc++;
+ }
+ else {
+ fprintf(stdout, "FAIL: /%s/ '%s' %d-%d : %d-%d\n", pattern, str,
+ from, to, region->beg[mem], region->end[mem]);
+ nfail++;
+ }
+ }
+ }
+ onig_free(reg);
+}
+
+static void x2(char* pattern, char* str, int from, int to)
+{
+ xx(pattern, str, from, to, 0, 0, 0);
+}
+
+static void x3(char* pattern, char* str, int from, int to, int mem)
+{
+ xx(pattern, str, from, to, mem, 0, 0);
+}
+
+static void n(char* pattern, char* str)
+{
+ xx(pattern, str, 0, 0, 0, 1, 0);
+}
+
+static void e(char* pattern, char* str, int error_no)
+{
+ xx(pattern, str, 0, 0, 0, 0, error_no);
+}
+
+static int test_fixed_interval()
+{
+ x2("a{1,3}?", "aaa", 0, 1);
+ x2("a{3}", "aaa", 0, 3);
+ x2("a{3}?", "aaa", 0, 3);
+ n("a{3}?", "aa");
+ x2("a{3,3}?", "aaa", 0, 3);
+ n("a{3,3}?", "aa");
+
+ x2("a{1,3}+", "aaaaaa", 0, 3);
+ x2("a{3}+", "aaaaaa", 0, 3);
+ x2("a{3,3}+", "aaaaaa", 0, 3);
+
+ return 0;
+}
+
+static int test_isolated_option()
+{
+ x2("", "", 0, 0);
+ x2("^", "", 0, 0);
+ n("^a", "\na");
+ n(".", "\n");
+ x2("(?s:.)", "\n", 0, 1);
+ x2("(?s).", "\n", 0, 1);
+ x2("(?s)a|.", "\n", 0, 1);
+ n("(?s:a)|.", "\n");
+ x2("b(?s)a|.", "\n", 0, 1);
+ n("((?s)a)|.", "\n");
+ n("b(?:(?s)a)|z|.", "\n");
+ n(".|b(?s)a", "\n");
+ n(".(?s)", "\n");
+ n("(?s)(?-s)a|.", "\n");
+ x2("(?s)a|.(?-s)", "\n", 0, 1);
+ x2("(?s)a|((?-s)).", "\n", 0, 1);
+ x2("(?s)a|(?:(?-s)).", "\n", 0, 1); // !!! Perl 5.26.1 returns empty match
+ x2("(?s)a|(?:).", "\n", 0, 1); // !!! Perl 5.26.1 returns empty match
+ x2("(?s)a|(?:.)", "\n", 0, 1);
+ x2("(?s)a|(?:a*).", "\n", 0, 1);
+ n("a|(?:).", "\n"); // !!! Perl 5.26.1 returns empty match
+ n("a|(?:)(.)", "\n");
+ x2("(?s)a|(?:)(.)", "\n", 0, 1);
+ x2("b(?s)a|(?:)(.)", "\n", 0, 1);
+ n("b((?s)a)|(?:)(.)", "\n");
+
+ return 0;
+}
+
+static int test_prec_read()
+{
+ x2("(?=a).b", "ab", 0, 2);
+ x2("(?=ab|(.))\\1", "ab", 1, 2); // doesn't backtrack if success once in prec-read
+ n("(?!(.)z)a\\1", "aa"); // ! Perl 5.26.1 match with "aa"
+
+ return 0;
+}
+
+static int test_look_behind()
+{
+ x2("(?<=a)b", "ab", 1, 2);
+ x2("(?<=a|b)c", "abc", 2, 3);
+ x2("(?<=a|(.))\\1", "abcc", 3, 4);
+
+ // following is not match in Perl and Java
+ //x2("(?<=a|(.))\\1", "aa", 1, 2);
+
+ n("(?<!c|c)a", "ca");
+
+ return 0;
+}
+
+extern int main(int argc, char* argv[])
+{
+ OnigEncoding use_encs[1];
+
+ use_encs[0] = ONIG_ENCODING_UTF8;
+ onig_initialize(use_encs, sizeof(use_encs)/sizeof(use_encs[0]));
+
+ err_file = stdout;
+
+ region = onig_region_new();
+
+ Syntax = ONIG_SYNTAX_PERL;
+
+ test_fixed_interval();
+ test_isolated_option();
+ test_prec_read();
+ test_look_behind();
+ e("(?<=ab|(.))\\1", "abb", ONIGERR_INVALID_LOOK_BEHIND_PATTERN); // Variable length lookbehind not implemented in Perl 5.26.1
+
+ x3("()", "abc", 0, 0, 1);
+ e("(", "", ONIGERR_END_PATTERN_WITH_UNMATCHED_PARENTHESIS);
+ // different spec.
+ // e("\\x{7fffffff}", "", ONIGERR_TOO_BIG_WIDE_CHAR_VALUE);
+
+ Syntax = ONIG_SYNTAX_JAVA;
+
+ test_fixed_interval();
+ test_isolated_option();
+ test_prec_read();
+ test_look_behind();
+ x2("(?<=ab|(.))\\1", "abb", 2, 3);
+ n("(?<!ab|b)c", "bbc");
+ n("(?<!b|ab)c", "bbc");
+
+ fprintf(stdout,
+ "\nRESULT SUCC: %4d, FAIL: %d, ERROR: %d (by Oniguruma %s)\n",
+ nsucc, nfail, nerror, onig_version());
+
+ onig_region_free(region, 1);
+ onig_end();
+
+ return ((nfail == 0 && nerror == 0) ? 0 : -1);
+}