Port test_error_messages

2024-11-24 14:23:52 +08:00 · 2023-12-09 20:47:43 +01:00 · 2023-12-09 20:47:43 +01:00 · d5ccbb6e9c
commit d5ccbb6e9c
parent f3d1e0d63a
3 changed files with 71 additions and 101 deletions
--- a/fish-rust/src/tests/mod.rs
+++ b/fish-rust/src/tests/mod.rs
@ -13,6 +13,7 @@ mod fd_monitor;
 mod highlight;
 mod history;
 mod pager;
+mod parse_util;
 mod parser;
 #[cfg(test)]
 mod redirection;
--- a/fish-rust/src/tests/parse_util.rs
+++ b/fish-rust/src/tests/parse_util.rs
@ -0,0 +1,70 @@
+use pcre2::utf32::Regex;
+
+use crate::ffi_tests::add_test;
+use crate::parse_constants::{
+    ERROR_BAD_VAR_CHAR1, ERROR_BRACKETED_VARIABLE1, ERROR_BRACKETED_VARIABLE_QUOTED1,
+    ERROR_NOT_ARGV_AT, ERROR_NOT_ARGV_COUNT, ERROR_NOT_ARGV_STAR, ERROR_NOT_PID, ERROR_NOT_STATUS,
+    ERROR_NO_VAR_NAME,
+};
+use crate::parse_util::parse_util_detect_errors;
+use crate::wchar::prelude::*;
+use crate::wchar_ext::WExt;
+
+add_test!("test_error_messages", || {
+    // Given a format string, returns a list of non-empty strings separated by format specifiers. The
+    // format specifiers themselves are omitted.
+    fn separate_by_format_specifiers(format: &wstr) -> Vec<&wstr> {
+        let format_specifier_regex = Regex::new(L!(r"%l?[ds]").as_char_slice()).unwrap();
+        let mut result = vec![];
+        let mut offset = 0;
+        for mtch in format_specifier_regex.find_iter(format.as_char_slice()) {
+            let mtch = mtch.unwrap();
+            result.push(&format[offset..mtch.start()]);
+            offset = mtch.end();
+        }
+        result
+    }
+
+    // Given a format string 'format', return true if the string may have been produced by that format
+    // string. We do this by splitting the format string around the format specifiers, and then ensuring
+    // that each of the remaining chunks is found (in order) in the string.
+    fn string_matches_format(s: &wstr, format: &wstr) -> bool {
+        let components = separate_by_format_specifiers(format);
+        let mut idx = 0;
+        for component in components {
+            let Some(relpos) = s[idx..].find(component) else {
+                return false;
+            };
+            idx += relpos + component.len();
+            assert!(idx <= s.len());
+        }
+        true
+    }
+
+    macro_rules! validate {
+        ($src:expr, $error_text_format:expr) => {
+            let mut errors = vec![];
+            let res = parse_util_detect_errors(L!($src), Some(&mut errors), false);
+            assert!(res.is_err());
+            assert!(
+                string_matches_format(&errors[0].text, L!($error_text_format)),
+                "{}",
+                $src
+            );
+        };
+    }
+
+    validate!("echo $^", ERROR_BAD_VAR_CHAR1);
+    validate!("echo foo${a}bar", ERROR_BRACKETED_VARIABLE1);
+    validate!("echo foo\"${a}\"bar", ERROR_BRACKETED_VARIABLE_QUOTED1);
+    validate!("echo foo\"${\"bar", ERROR_BAD_VAR_CHAR1);
+    validate!("echo $?", ERROR_NOT_STATUS);
+    validate!("echo $$", ERROR_NOT_PID);
+    validate!("echo $#", ERROR_NOT_ARGV_COUNT);
+    validate!("echo $@", ERROR_NOT_ARGV_AT);
+    validate!("echo $*", ERROR_NOT_ARGV_STAR);
+    validate!("echo $", ERROR_NO_VAR_NAME);
+    validate!("echo foo\"$\"bar", ERROR_NO_VAR_NAME);
+    validate!("echo \"foo\"$\"bar\"", ERROR_NO_VAR_NAME);
+    validate!("echo foo $ bar", ERROR_NO_VAR_NAME);
+});
--- a/src/fish_tests.cpp
+++ b/src/fish_tests.cpp
@ -1077,106 +1077,6 @@ static void test_input() {
    }
 }

-// Given a format string, returns a list of non-empty strings separated by format specifiers. The
-// format specifiers themselves are omitted.
-static std::vector<wcstring> separate_by_format_specifiers(const wchar_t *format) {
-    std::vector<wcstring> result;
-    const wchar_t *cursor = format;
-    const wchar_t *end = format + std::wcslen(format);
-    while (cursor < end) {
-        const wchar_t *next_specifier = std::wcschr(cursor, '%');
-        if (next_specifier == nullptr) {
-            next_specifier = end;
-        }
-        assert(next_specifier != nullptr);
-
-        // Don't return empty strings.
-        if (next_specifier > cursor) {
-            result.emplace_back(cursor, next_specifier - cursor);
-        }
-
-        // Walk over the format specifier (if any).
-        cursor = next_specifier;
-        if (*cursor != '%') {
-            continue;
-        }
-
-        cursor++;
-        // Flag
-        if (std::wcschr(L"#0- +'", *cursor)) cursor++;
-        // Minimum field width
-        while (iswdigit(*cursor)) cursor++;
-        // Precision
-        if (*cursor == L'.') {
-            cursor++;
-            while (iswdigit(*cursor)) cursor++;
-        }
-        // Length modifier
-        if (!std::wcsncmp(cursor, L"ll", 2) || !std::wcsncmp(cursor, L"hh", 2)) {
-            cursor += 2;
-        } else if (std::wcschr(L"hljtzqL", *cursor)) {
-            cursor++;
-        }
-        // The format specifier itself. We allow any character except NUL.
-        if (*cursor != L'\0') {
-            cursor += 1;
-        }
-        assert(cursor <= end);
-    }
-    return result;
-}
-
-// Given a format string 'format', return true if the string may have been produced by that format
-// string. We do this by splitting the format string around the format specifiers, and then ensuring
-// that each of the remaining chunks is found (in order) in the string.
-static bool string_matches_format(const wcstring &string, const wchar_t *format) {
-    bool result = true;
-    std::vector<wcstring> components = separate_by_format_specifiers(format);
-    size_t idx = 0;
-    for (const auto &component : components) {
-        size_t where = string.find(component, idx);
-        if (where == wcstring::npos) {
-            result = false;
-            break;
-        }
-        idx = where + component.size();
-        assert(idx <= string.size());
-    }
-    return result;
-}
-
-// todo!("port this")
-static void test_error_messages() {
-    say(L"Testing error messages");
-    const struct error_test_t {
-        const wchar_t *src;
-        const wchar_t *error_text_format;
-    } error_tests[] = {{L"echo $^", ERROR_BAD_VAR_CHAR1},
-                       {L"echo foo${a}bar", ERROR_BRACKETED_VARIABLE1},
-                       {L"echo foo\"${a}\"bar", ERROR_BRACKETED_VARIABLE_QUOTED1},
-                       {L"echo foo\"${\"bar", ERROR_BAD_VAR_CHAR1},
-                       {L"echo $?", ERROR_NOT_STATUS},
-                       {L"echo $$", ERROR_NOT_PID},
-                       {L"echo $#", ERROR_NOT_ARGV_COUNT},
-                       {L"echo $@", ERROR_NOT_ARGV_AT},
-                       {L"echo $*", ERROR_NOT_ARGV_STAR},
-                       {L"echo $", ERROR_NO_VAR_NAME},
-                       {L"echo foo\"$\"bar", ERROR_NO_VAR_NAME},
-                       {L"echo \"foo\"$\"bar\"", ERROR_NO_VAR_NAME},
-                       {L"echo foo $ bar", ERROR_NO_VAR_NAME}};
-
-    auto errors = new_parse_error_list();
-    for (const auto &test : error_tests) {
-        errors->clear();
-        parse_util_detect_errors(test.src, &*errors);
-        do_test(!errors->empty());
-        if (!errors->empty()) {
-            do_test1(string_matches_format(*errors->at(0)->text(), test.error_text_format),
-                     test.src);
-        }
-    }
-}
-
 // todo!("port this")
 static void test_wwrite_to_fd() {
    say(L"Testing wwrite_to_fd");
@ -1487,7 +1387,6 @@ static const test_t s_tests[]{
    {TEST_GROUP("enum"), test_enum_array},
    {TEST_GROUP("autosuggestion"), test_autosuggestion_combining},
    {TEST_GROUP("test_abbreviations"), test_abbreviations},
-    {TEST_GROUP("error_messages"), test_error_messages},
    {TEST_GROUP("convert"), test_convert},
    {TEST_GROUP("convert"), test_convert_private_use},
    {TEST_GROUP("convert_ascii"), test_convert_ascii},