Regex: Fix handling of all Unicode codepoints as start chars

2017-10-20 18:26:33 +08:00 · 2017-10-20 18:26:33 +08:00 · 60e32d73ff
commit 60e32d73ff
parent df2bf9601c
1 changed file with 7 additions and 0 deletions
--- a/src/regex_impl.cc
+++ b/src/regex_impl.cc
@@ -858,6 +858,8 @@ private:
                    else
                        start_chars.map[node->value] = true;
                }
+                else
+                    start_chars.accept_other = true;
                return node->quantifier.allows_none();
            case ParsedRegex::AnyChar:
                for (auto& b : start_chars.map)
@@ -1332,6 +1334,11 @@ auto test_regex = UnitTest{[]{
        kak_assert(vm.exec("abcde"));
    }

+    {
+        TestVM<> vm{R"(д)"};
+        kak_assert(vm.exec("д", RegexExecFlags::Search));
+    }
+
    {
        TestVM<> vm{R"(\0\x0A\u260e\u260F)"};
        const char str[] = "\0\n☎☏"; // work around the null byte in the literal