fish-shell/src/parse_util.cpp

// Various mostly unrelated utility functions related to parsing, loading and evaluating fish code.
//
// This library can be seen as a 'toolbox' for functions that are used in many places in fish and
// that are somehow related to parsing the code.
#include "config.h"  // IWYU pragma: keep

#include "parse_util.h"

#include <stdarg.h>
#include <stdlib.h>

#include <cwchar>
#include <memory>
#include <string>
#include <type_traits>

#include "ast.h"
#include "builtin.h"
#include "common.h"
#include "expand.h"
#include "fallback.h"  // IWYU pragma: keep
#include "future_feature_flags.h"
#include "parse_constants.h"
#include "parse_util.h"
#include "parser.h"
#include "tokenizer.h"
#include "wcstringutil.h"
#include "wildcard.h"
#include "wutil.h"  // IWYU pragma: keep

/// Error message for use of backgrounded commands before and/or.
/// The format takes one wide-string argument (%ls): the command named in the message.
#define BOOL_AFTER_BACKGROUND_ERROR_MSG \
    _(L"The '%ls' command can not be used immediately after a backgrounded job")

/// Error message for backgrounded commands as conditionals.
#define BACKGROUND_IN_CONDITIONAL_ERROR_MSG \
    _(L"Backgrounded commands can not be used as conditionals")

/// Error message for arguments to 'end'.
#define END_ARG_ERR_MSG _(L"'end' does not take arguments. Did you forget a ';'?")

/// Maximum length of a variable name to show in error reports before truncation.
/// Passed to truncate() when formatting bracketed-variable errors.
static constexpr int var_err_len = 16;

/// Compute the 1-based line number of the position \p offset within \p str.
///
/// \param str the NUL-terminated text to scan; may be null.
/// \param offset the number of leading characters to examine. Scanning stops early at the
/// terminating NUL.
/// \return 0 if \p str is null, otherwise 1 plus the number of newlines found before \p offset.
int parse_util_lineno(const wchar_t *str, size_t offset) {
    if (str == nullptr) {
        return 0;
    }

    // Walk forward until either the offset or the end of the string is reached.
    int line = 1;
    const wchar_t *cursor = str;
    size_t remaining = offset;
    while (remaining > 0 && *cursor != L'\0') {
        line += (*cursor == L'\n') ? 1 : 0;
        ++cursor;
        --remaining;
    }
    return line;
}

/// Compute the 0-based line index of the position \p pos within \p str.
///
/// \param str the text to scan.
/// \param pos the number of leading characters to examine.
/// \return the number of newlines among the first \p pos characters, or -1 if a NUL character
/// (including the string terminator) is encountered before \p pos is reached.
int parse_util_get_line_from_offset(const wcstring &str, size_t pos) {
    const wchar_t *const text = str.c_str();
    int newlines_seen = 0;
    size_t idx = 0;
    while (idx < pos) {
        const wchar_t c = text[idx++];
        if (c == L'\0') {
            // Ran off the end of the string before reaching pos.
            return -1;
        }
        if (c == L'\n') {
            ++newlines_seen;
        }
    }
    return newlines_seen;
}

/// Compute the offset of the first character of the 0-based line \p line within \p str.
///
/// \param str the text to scan.
/// \param line the 0-based line index.
/// \return 0 for line 0, the offset just past the line's preceding newline otherwise, or
/// static_cast<size_t>(-1) if \p line is negative or the text has fewer newlines than \p line.
size_t parse_util_get_offset_from_line(const wcstring &str, int line) {
    constexpr size_t not_found = static_cast<size_t>(-1);
    if (line < 0) return not_found;
    if (line == 0) return 0;

    // Count down newlines; the requested line starts right after the line'th one.
    const wchar_t *const text = str.c_str();
    int newlines_left = line;
    for (size_t idx = 0; text[idx] != L'\0'; ++idx) {
        if (text[idx] == L'\n' && --newlines_left == 0) {
            return idx + 1;
        }
    }
    return not_found;
}

/// Convert a (line, column) pair into an offset within \p str.
///
/// \param str the text to index into.
/// \param line the 0-based line index.
/// \param line_offset the column within the line. Negative values are treated as 0 and values
/// past the end of the line are clamped to the line's length.
/// \return the resulting offset, or static_cast<size_t>(-1) if \p line does not exist.
size_t parse_util_get_offset(const wcstring &str, int line, long line_offset) {
    constexpr size_t invalid = static_cast<size_t>(-1);

    const size_t line_start = parse_util_get_offset_from_line(str, line);
    size_t next_line_start = parse_util_get_offset_from_line(str, line + 1);

    if (line_start == invalid) {
        return invalid;
    }
    if (next_line_start == invalid) {
        // This is the last line: pretend the next line starts one past the terminator.
        next_line_start = str.length() + 1;
    }

    // The line's length, excluding its trailing newline (or the terminator).
    const size_t line_length = next_line_start - line_start - 1;

    size_t column = (line_offset < 0) ? 0 : static_cast<size_t>(line_offset);
    if (column >= line_length) {
        column = line_length;
    }
    return line_start + column;
}

/// Locate the first outermost bracket pair in \p in, skipping quoted text and characters that
/// follow an unescaped backslash.
///
/// \param in the NUL-terminated text to search; must not be null.
/// \param begin if non-null, receives a pointer to the opening bracket on success.
/// \param end if non-null, receives a pointer to the matching closing bracket on success, or to
/// the terminating NUL if the bracket was left open.
/// \param allow_incomplete whether an unclosed bracket is acceptable.
/// \param open_type the opening character, typically ( or [.
/// \param close_type the corresponding closing character.
/// \return -1 on a syntax error (a stray closing bracket, or an unclosed bracket when
/// \p allow_incomplete is false), 0 if no opening bracket was found, 1 if a pair was found.
static int parse_util_locate_brackets_of_type(const wchar_t *in, wchar_t **begin, wchar_t **end,
                                              bool allow_incomplete, wchar_t open_type,
                                              wchar_t close_type) {
    assert(in && "null parameter");

    wchar_t *const text = const_cast<wchar_t *>(in);
    wchar_t *first_open = nullptr;
    wchar_t *matching_close = nullptr;
    int depth = 0;
    bool prev_was_backslash = false;

    wchar_t *scan = text;
    while (*scan != L'\0') {
        // A character preceded by an unescaped backslash has no special meaning.
        const bool active = !prev_was_backslash;
        if (active && (*scan == L'\'' || *scan == L'"')) {
            // Jump over the quoted region; give up scanning if the quote is unterminated.
            wchar_t *closing_quote = quote_end(scan);
            if (closing_quote == nullptr || *closing_quote == L'\0') {
                break;
            }
            scan = closing_quote;
        } else if (active && *scan == open_type) {
            if (depth == 0 && first_open == nullptr) {
                first_open = scan;
            }
            ++depth;
        } else if (active && *scan == close_type) {
            --depth;
            if (depth == 0 && matching_close == nullptr) {
                matching_close = scan;
                break;
            }
            if (depth < 0) {
                // Closing bracket without an opener; reported as a syntax error below.
                break;
            }
        }

        prev_was_backslash = (*scan == L'\\') ? !prev_was_backslash : false;
        ++scan;
    }

    const bool stray_close = depth < 0;
    const bool unclosed_not_allowed = depth > 0 && !allow_incomplete;
    if (stray_close || unclosed_not_allowed) {
        return -1;
    }

    if (first_open == nullptr) {
        return 0;
    }

    if (begin != nullptr) {
        *begin = first_open;
    }
    if (end != nullptr) {
        // An unclosed bracket extends to the end of the text.
        *end = (depth != 0) ? text + std::wcslen(in) : matching_close;
    }
    return 1;
}

/// Locate the first outermost parenthesized command substitution in \p in.
/// Parameters and return value are those of parse_util_locate_brackets_of_type(), with
/// parentheses as the bracket pair.
int parse_util_locate_cmdsubst(const wchar_t *in, wchar_t **begin, wchar_t **end,
                               bool accept_incomplete) {
    constexpr wchar_t open_paren = L'(';
    constexpr wchar_t close_paren = L')';
    return parse_util_locate_brackets_of_type(in, begin, end, accept_incomplete, open_paren,
                                              close_paren);
}

/// Locate the first outermost square-bracketed slice in \p in.
/// Parameters and return value are those of parse_util_locate_brackets_of_type(), with square
/// brackets as the bracket pair.
int parse_util_locate_slice(const wchar_t *in, wchar_t **begin, wchar_t **end,
                            bool accept_incomplete) {
    constexpr wchar_t open_square = L'[';
    constexpr wchar_t close_square = L']';
    return parse_util_locate_brackets_of_type(in, begin, end, accept_incomplete, open_square,
                                              close_square);
}

/// Offset-based wrapper around parse_util_locate_brackets_of_type().
///
/// \param str the text to search.
/// \param inout_cursor_offset on entry, the offset at which to start searching; on success it
/// is advanced to one past the end of the located range (which may exceed str.size()).
/// \param out_contents if non-null, cleared and then filled with the text between the brackets.
/// \param out_start receives the offset of the opening bracket (0 if nothing is found).
/// \param out_end receives the offset of the closing bracket, or of the end of the text for an
/// unclosed bracket (str.size() if nothing is found).
/// \param accept_incomplete whether an unclosed bracket is acceptable.
/// \param open_type the opening bracket character.
/// \param close_type the closing bracket character.
/// \return -1 on syntax error, 0 if nothing was found, 1 if a range was located.
static int parse_util_locate_brackets_range(const wcstring &str, size_t *inout_cursor_offset,
                                            wcstring *out_contents, size_t *out_start,
                                            size_t *out_end, bool accept_incomplete,
                                            wchar_t open_type, wchar_t close_type) {
    const size_t len = str.size();

    // Start from "nothing found" outputs.
    if (out_contents != nullptr) {
        out_contents->clear();
    }
    *out_start = 0;
    *out_end = len;

    // A cursor at or beyond the end leaves nothing to search.
    const size_t search_from = *inout_cursor_offset;
    if (search_from >= len) {
        return 0;
    }

    const wchar_t *const base = str.c_str();
    const wchar_t *const search_begin = base + search_from;
    const wchar_t *const search_limit = base + len;

    // Hand off to the pointer-based implementation.
    wchar_t *open_ptr = nullptr;
    wchar_t *close_ptr = nullptr;
    const int status = parse_util_locate_brackets_of_type(
        search_begin, &open_ptr, &close_ptr, accept_incomplete, open_type, close_type);
    if (status <= 0) {
        return status;
    }

    // Both ends must be set, lie within the searched range, and be correctly ordered.
    assert(open_ptr != nullptr && open_ptr >= search_begin && open_ptr <= search_limit);
    assert(close_ptr != nullptr && close_ptr > open_ptr && close_ptr >= search_begin &&
           close_ptr <= search_limit);

    if (out_contents != nullptr) {
        const wchar_t *const inner = open_ptr + 1;
        out_contents->assign(inner, close_ptr - inner);
    }

    *out_start = open_ptr - base;
    *out_end = close_ptr - base;

    // Continue the next search just past this range.
    *inout_cursor_offset = *out_end + 1;
    return status;
}

/// Locate the next parenthesized command substitution in \p str, starting at
/// \p *inout_cursor_offset. Parameters and return value are those of
/// parse_util_locate_brackets_range(), with parentheses as the bracket pair.
int parse_util_locate_cmdsubst_range(const wcstring &str, size_t *inout_cursor_offset,
                                     wcstring *out_contents, size_t *out_start, size_t *out_end,
                                     bool accept_incomplete) {
    constexpr wchar_t open_paren = L'(';
    constexpr wchar_t close_paren = L')';
    return parse_util_locate_brackets_range(str, inout_cursor_offset, out_contents, out_start,
                                            out_end, accept_incomplete, open_paren, close_paren);
}

/// Find the command substitution that most tightly surrounds the cursor.
///
/// \param buff the NUL-terminated text to search; must not be null.
/// \param cursor_pos the cursor offset in \p buff; asserted to be no greater than its length.
/// \param a if non-null, receives the start of the extent: the character after the opening
/// parenthesis of the tightest enclosing substitution, or \p buff itself if none encloses the
/// cursor.
/// \param b if non-null, receives the end of the extent: the closing parenthesis of that
/// substitution (or the end of the text if it is unclosed), or the end of \p buff if none
/// encloses the cursor.
void parse_util_cmdsubst_extent(const wchar_t *buff, size_t cursor_pos, const wchar_t **a,
                                const wchar_t **b) {
    assert(buff && "Null buffer");
    const wchar_t *const cursor = buff + cursor_pos;

    const size_t bufflen = std::wcslen(buff);
    assert(cursor_pos <= bufflen);

    // ap and bp are the beginning and end of the tightest command substitution found so far.
    // They start out covering the whole buffer.
    const wchar_t *ap = buff, *bp = buff + bufflen;
    const wchar_t *pos = buff;
    for (;;) {
        wchar_t *begin = nullptr, *end = nullptr;
        // Incomplete substitutions are accepted, so an unclosed '(' extends to the end.
        if (parse_util_locate_cmdsubst(pos, &begin, &end, true) <= 0) {
            // No subshell found, all done.
            break;
        }
        // Interpret NULL to mean the end.
        if (end == nullptr) {
            end = const_cast<wchar_t *>(buff) + bufflen;
        }

        if (begin < cursor && end >= cursor) {
            // This command substitution surrounds the cursor, so it's a tighter fit.
            // Step past the opening parenthesis so the extent covers only the interior.
            begin++;
            ap = begin;
            bp = end;
            // pos is where to begin looking for the next one. But if we reached the end there's no
            // next one.
            if (begin >= end) break;
            // NOTE(review): begin already points past the opening parenthesis here, so the next
            // search starts one character further in. A substitution that opens immediately
            // after the parenthesis looks like it would be skipped - confirm this is intended.
            pos = begin + 1;
        } else if (begin >= cursor) {
            // This command substitution starts at or after the cursor. Since it was the first
            // command substitution in the string, we're done.
            break;
        } else {
            // This command substitution ends before the cursor. Skip it.
            assert(end < cursor);
            pos = end + 1;
            assert(pos <= buff + bufflen);
        }
    }

    if (a != nullptr) *a = ap;
    if (b != nullptr) *b = bp;
}

/// Get the beginning and end of the job or process definition under the cursor.
///
/// \param process if true, pipe tokens also act as separators (process extent); if false, only
/// the other separator tokens do (job extent).
/// \param buff the NUL-terminated command line; must not be null.
/// \param cursor_pos the cursor offset in \p buff.
/// \param a if non-null, receives the start of the extent. It is first reset to null, then set
/// to the start of the enclosing command substitution and moved past each separator that lies
/// before the cursor.
/// \param b if non-null, receives the end of the extent. It is first reset to null, then set to
/// the end of the enclosing command substitution, or to the first separator at or after the
/// cursor.
/// \param tokens if non-null, receives the non-separator tokens found within the extent. Token
/// offsets are those reported by the tokenizer, i.e. relative to the start of the enclosing
/// command substitution.
static void job_or_process_extent(bool process, const wchar_t *buff, size_t cursor_pos,
                                  const wchar_t **a, const wchar_t **b,
                                  std::vector<tok_t> *tokens) {
    assert(buff && "Null buffer");
    const wchar_t *begin = nullptr, *end = nullptr;
    int finished = 0;

    if (a) *a = nullptr;
    if (b) *b = nullptr;
    // Restrict the search to the command substitution surrounding the cursor.
    parse_util_cmdsubst_extent(buff, cursor_pos, &begin, &end);
    if (!end || !begin) {
        return;
    }

    assert(cursor_pos >= static_cast<size_t>(begin - buff));
    // The cursor position relative to the start of the command substitution.
    const size_t pos = cursor_pos - (begin - buff);

    if (a) *a = begin;
    if (b) *b = end;

    // Tokenize a copy of the substitution's text; unfinished tokens are accepted.
    const wcstring buffcpy(begin, end);
    tokenizer_t tok(buffcpy.c_str(), TOK_ACCEPT_UNFINISHED);
    maybe_t<tok_t> token{};
    while ((token = tok.next()) && !finished) {
        size_t tok_begin = token->offset;

        switch (token->type) {
            case token_type_t::pipe: {
                // For job extents a pipe is an ordinary token: leave the switch so that it is
                // appended to the token list below.
                if (!process) {
                    break;
                }
            }
            /* FALLTHROUGH */
            case token_type_t::end:
            case token_type_t::background:
            case token_type_t::andand:
            case token_type_t::oror:
            case token_type_t::comment: {
                if (tok_begin >= pos) {
                    // First separator at or after the cursor: the extent ends here.
                    finished = 1;
                    if (b) *b = const_cast<wchar_t *>(begin) + tok_begin;
                } else {
                    // Statement at cursor might start after this token.
                    if (a) *a = const_cast<wchar_t *>(begin) + tok_begin + token->length;
                    if (tokens) tokens->clear();
                }
                continue;  // Do not add this to tokens
            }
            default: {
                break;
            }
        }
        if (tokens) tokens->push_back(*token);
    }
}

/// Find the extent of the process under the cursor; pipes count as separators.
/// Parameters are forwarded unchanged to job_or_process_extent().
void parse_util_process_extent(const wchar_t *buff, size_t pos, const wchar_t **a,
                               const wchar_t **b, std::vector<tok_t> *tokens) {
    constexpr bool split_on_pipes = true;
    job_or_process_extent(split_on_pipes, buff, pos, a, b, tokens);
}

void parse_util_job_extent(const wchar_t *buff, size_t pos, const wchar_t **a, const wchar_t **b) {
    job_or_process_extent(false, buff, pos, a, b, nullptr);
}

void parse_util_token_extent(const wchar_t *buff, size_t cursor_pos, const wchar_t **tok_begin,
                             const wchar_t **tok_end, const wchar_t **prev_begin,
                             const wchar_t **prev_end) {
    assert(buff && "Null buffer");
    const wchar_t *a = nullptr, *b = nullptr, *pa = nullptr, *pb = nullptr;

    const wchar_t *cmdsubst_begin, *cmdsubst_end;
    parse_util_cmdsubst_extent(buff, cursor_pos, &cmdsubst_begin, &cmdsubst_end);

    if (!cmdsubst_end || !cmdsubst_begin) {
        return;
    }

    // pos is equivalent to cursor_pos within the range of the command substitution {begin, end}.
    size_t offset_within_cmdsubst = cursor_pos - (cmdsubst_begin - buff);

    size_t bufflen = std::wcslen(buff);

    a = cmdsubst_begin + offset_within_cmdsubst;
    b = a;
    pa = cmdsubst_begin + offset_within_cmdsubst;
    pb = pa;

    assert(cmdsubst_begin >= buff);
    assert(cmdsubst_begin <= (buff + bufflen));
    assert(cmdsubst_end >= cmdsubst_begin);
    assert(cmdsubst_end <= (buff + bufflen));

    const wcstring buffcpy = wcstring(cmdsubst_begin, cmdsubst_end - cmdsubst_begin);

    tokenizer_t tok(buffcpy.c_str(), TOK_ACCEPT_UNFINISHED);
    while (maybe_t<tok_t> token = tok.next()) {
        size_t tok_begin = token->offset;
        size_t tok_end = tok_begin;

        // Calculate end of token.
        if (token->type == token_type_t::string) {
            tok_end += token->length;
        }

        // Cursor was before beginning of this token, means that the cursor is between two tokens,
        // so we set it to a zero element string and break.
        if (tok_begin > offset_within_cmdsubst) {
            a = b = cmdsubst_begin + offset_within_cmdsubst;
            break;
        }

        // If cursor is inside the token, this is the token we are looking for. If so, set a and b
        // and break.
        if (token->type == token_type_t::string && tok_end >= offset_within_cmdsubst) {
            a = cmdsubst_begin + token->offset;
            b = a + token->length;
            break;
        }

        // Remember previous string token.
        if (token->type == token_type_t::string) {
            pa = cmdsubst_begin + token->offset;
            pb = pa + token->length;
        }
    }

    if (tok_begin) *tok_begin = a;
    if (tok_end) *tok_end = b;
    if (prev_begin) *prev_begin = pa;
    if (prev_end) *prev_end = pb;

    assert(pa >= buff);
    assert(pa <= (buff + bufflen));
    assert(pb >= pa);
    assert(pb <= (buff + bufflen));
}

/// Convert literal wildcard characters in \p str to their internal representation.
///
/// An unescaped '*' becomes ANY_STRING. An unescaped '?' becomes ANY_CHAR unless the
/// qmark_noglob feature is enabled. A backslash-escaped wildcard loses its backslash and is
/// kept literally; an escaped backslash is copied through as two backslashes.
///
/// \param str the text to convert, read up to its first NUL character.
/// \return the converted text.
wcstring parse_util_unescape_wildcards(const wcstring &str) {
    const bool qmark_is_glob = !feature_test(features_t::qmark_noglob);

    wcstring unescaped;
    unescaped.reserve(str.size());

    const wchar_t *cursor = str.c_str();
    while (*cursor != L'\0') {
        const wchar_t c = cursor[0];
        // Safe to peek: c is not the terminator, so cursor[1] is at worst the terminator.
        const wchar_t next = cursor[1];

        if (c == L'\\') {
            const bool escaped_wildcard = next == L'*' || (next == L'?' && qmark_is_glob);
            if (escaped_wildcard) {
                unescaped.push_back(next);
                cursor += 2;
                continue;
            }
            if (next == L'\\') {
                // Not a wildcard, but consume both so the second backslash is not seen as
                // escaping whatever follows.
                unescaped.append(L"\\\\");
                cursor += 2;
                continue;
            }
            unescaped.push_back(c);
        } else if (c == L'*') {
            unescaped.push_back(ANY_STRING);
        } else if (c == L'?' && qmark_is_glob) {
            unescaped.push_back(ANY_CHAR);
        } else {
            unescaped.push_back(c);
        }
        ++cursor;
    }
    return unescaped;
}

/// Determine which quote character, if any, is still open at offset \p len of \p cmd_str.
///
/// \param cmd_str the token text.
/// \param len the offset of interest within \p cmd_str.
/// \return the character of the first quote whose closing quote is missing or lies beyond
/// \p len, or 0 if there is no such quote.
static wchar_t get_quote(const wcstring &cmd_str, size_t len) {
    const wchar_t *const base = cmd_str.c_str();
    const wchar_t *scan = base;

    while (*scan != L'\0') {
        switch (*scan) {
            case L'\\': {
                // Skip the backslash and the character it escapes, if there is one.
                ++scan;
                if (*scan == L'\0') return L'\0';
                ++scan;
                break;
            }
            case L'\'':
            case L'"': {
                const wchar_t *closing = quote_end(scan);
                const bool unterminated = closing == nullptr || *closing == L'\0';
                if (unterminated || closing > base + len) {
                    return *scan;
                }
                // Resume just past the closing quote.
                scan = closing + 1;
                break;
            }
            default: {
                ++scan;
                break;
            }
        }
    }
    return L'\0';
}

void parse_util_get_parameter_info(const wcstring &cmd, const size_t pos, wchar_t *quote,
                                   size_t *offset, token_type_t *out_type) {
    size_t prev_pos = 0;
    wchar_t last_quote = L'\0';

    tokenizer_t tok(cmd.c_str(), TOK_ACCEPT_UNFINISHED);
    while (auto token = tok.next()) {
        if (token->offset > pos) break;

        if (token->type == token_type_t::string)
            last_quote = get_quote(tok.text_of(*token), pos - token->offset);

        if (out_type != nullptr) *out_type = token->type;

        prev_pos = token->offset;
    }

    wchar_t *cmd_tmp = wcsdup(cmd.c_str());
    cmd_tmp[pos] = 0;
    size_t cmdlen = pos;
    bool finished = cmdlen != 0;
    if (finished) {
        finished = (quote == nullptr);
        if (finished && std::wcschr(L" \t\n\r", cmd_tmp[cmdlen - 1])) {
            finished = cmdlen > 1 && cmd_tmp[cmdlen - 2] == L'\\';
        }
    }

    if (quote) *quote = last_quote;

    if (offset != nullptr) {
        if (finished) {
            while ((cmd_tmp[prev_pos] != 0) && (std::wcschr(L";|", cmd_tmp[prev_pos]) != nullptr))
                prev_pos++;
            *offset = prev_pos;
        } else {
            *offset = pos;
        }
    }

    free(cmd_tmp);
}

/// Escape \p cmd so that it can be inserted into a command line, optionally inside quotes.
///
/// \param cmd the text to escape.
/// \param quote the quote character the text will be placed inside, or L'\0' for unquoted text.
/// \param no_tilde when \p quote is L'\0', adds ESCAPE_NO_TILDE to the flags passed to
/// escape_string(). It is not consulted for quoted text.
/// \return the escaped text.
wcstring parse_util_escape_string_with_quote(const wcstring &cmd, wchar_t quote, bool no_tilde) {
    if (quote == L'\0') {
        // Unquoted: defer entirely to the general-purpose escaper.
        const escape_flags_t flags =
            ESCAPE_ALL | ESCAPE_NO_QUOTED | (no_tilde ? ESCAPE_NO_TILDE : 0);
        return escape_string(cmd, flags);
    }

    wcstring quoted;
    quoted.reserve(cmd.size());

    // Some characters (e.g. newlines) cannot be represented inside quotes. For those, close
    // the quote, emit a backslash escape, and reopen the quote.
    const auto append_outside_quotes = [&quoted, quote](wchar_t escape_letter) {
        quoted.push_back(quote);
        quoted.push_back(L'\\');
        quoted.push_back(escape_letter);
        quoted.push_back(quote);
    };

    for (const wchar_t c : cmd) {
        if (c == L'\n') {
            append_outside_quotes(L'n');
        } else if (c == L'\t') {
            append_outside_quotes(L't');
        } else if (c == L'\b') {
            append_outside_quotes(L'b');
        } else if (c == L'\r') {
            append_outside_quotes(L'r');
        } else if (c == L'\\') {
            quoted.append(L"\\\\");
        } else {
            // '$' needs a backslash only inside double quotes; any other character needs one
            // only if it is the enclosing quote character itself.
            const bool needs_backslash = (c == L'$') ? (quote == L'"') : (c == quote);
            if (needs_backslash) {
                quoted.push_back(L'\\');
            }
            quoted.push_back(c);
        }
    }
    return quoted;
}

/// Compute the indentation level of every character in \p src.
///
/// \param src the source text to indent.
/// \return a vector with one entry per character of \p src, holding that character's indent
/// level. If \p src contains no newline, every entry is 0.
std::vector<int> parse_util_compute_indents(const wcstring &src) {
    // Make a vector the same size as the input string, which contains the indents. Initialize them
    // to 0.
    const size_t src_size = src.size();
    std::vector<int> indents(src_size, 0);

    // Simple trick: if our source does not contain a newline, then all indents are 0.
    if (src.find('\n') == wcstring::npos) {
        return indents;
    }

    // Parse the string. We pass continue_after_error to produce a forest; the trailing indent of
    // the last node we visited becomes the input indent of the next. I.e. in the case of 'switch
    // foo ; cas', we get an invalid parse tree (since 'cas' is not valid) but we indent it as if it
    // were a case item list.
    using namespace ast;
    auto ast =
        ast_t::parse(src, parse_flag_continue_after_error | parse_flag_include_comments |
                              parse_flag_accept_incomplete_tokens | parse_flag_leave_unterminated);

    // Visit all of our nodes. When we get a job_list or case_item_list, increment indent while
    // visiting its children.
    struct indent_visitor_t {
        indent_visitor_t(const wcstring &src, std::vector<int> &indents)
            : src(src), indents(indents) {}

        // Visit a single node: decide how much it indents its children (inc) and how much of
        // that is undone afterwards (dec), record indents for leaves, then recurse.
        void visit(const node_t &node) {
            int inc = 0;
            int dec = 0;
            switch (node.type) {
                case type_t::job_list:
                case type_t::andor_job_list:
                    // Job lists are never unwound.
                    inc = 1;
                    dec = 1;
                    break;

                // Increment indents for conditions in headers (#1665).
                case type_t::job_conjunction:
                    if (node.parent->type == type_t::while_header ||
                        node.parent->type == type_t::if_clause) {
                        inc = 1;
                        dec = 1;
                    }
                    break;

                // Increment indents for job_continuation_t if it contains a newline.
                // This is a bit of a hack - it indents cases like:
                //    cmd1 |
                //    ....cmd2
                // but avoids "double indenting" if there's no newline:
                //   cmd1 | while cmd2
                //   ....cmd3
                //   end
                // See #7252.
                case type_t::job_continuation:
                    if (has_newline(node.as<job_continuation_t>()->newlines)) {
                        inc = 1;
                        dec = 1;
                    }
                    break;

                // Likewise for && and ||.
                case type_t::job_conjunction_continuation:
                    if (has_newline(node.as<job_conjunction_continuation_t>()->newlines)) {
                        inc = 1;
                        dec = 1;
                    }
                    break;

                case type_t::case_item_list:
                    // Here's a hack. Consider:
                    // switch abc
                    //    cas
                    //
                    // fish will see that 'cas' is not valid inside a switch statement because it is
                    // not "case". It will then unwind back to the top level job list, producing a
                    // parse tree like:
                    //
                    //   job_list
                    //      switch_job
                    //         <err>
                    //      normal_job
                    //         cas
                    //
                    // And so we will think that the 'cas' job is at the same level as the switch.
                    // To address this, if we see that the switch statement was not closed, do not
                    // decrement the indent afterwards.
                    inc = 1;
                    dec = node.parent->as<switch_statement_t>()->end.unsourced ? 0 : 1;
                    break;
                case type_t::token_base: {
                    auto tok = node.as<token_base_t>();
                    if (node.parent->type == type_t::begin_header &&
                        tok->type == parse_token_type_t::end) {
                        // The newline after "begin" is optional, so it is part of the header.
                        // The header is not in the indented block, so indent the newline here.
                        if (node.source(src) == L"\n") {
                            inc = 1;
                            dec = 1;
                        }
                    }
                    break;
                }
                default:
                    break;
            }

            auto range = node.source_range();
            if (range.length > 0 && node.category == category_t::leaf) {
                // The text between the previous leaf and this one gets the last assigned indent.
                record_line_continuations_until(range.start);
                std::fill(indents.begin() + last_leaf_end, indents.begin() + range.start,
                          last_indent);
            }

            indent += inc;

            // If we increased the indentation, apply it to the remainder of the string, even if the
            // list is empty. For example (where _ represents the cursor):
            //
            //    if foo
            //       _
            //
            // we want to indent the newline.
            if (inc) {
                last_indent = indent;
            }

            // If this is a leaf node, apply the current indentation.
            if (node.category == category_t::leaf && range.length > 0) {
                std::fill(indents.begin() + range.start, indents.begin() + range.end(), indent);
                last_leaf_end = range.start + range.length;
                last_indent = indent;
            }

            node_visitor(*this).accept_children_of(&node);
            indent -= dec;
        }

        /// \return whether a maybe_newlines node contains at least one newline.
        bool has_newline(const maybe_newlines_t &nls) const {
            return nls.source(src).find(L'\n') != wcstring::npos;
        }

        // Record the newlines that follow a backslash-newline in the text between the last leaf
        // and \p offset, so that the lines they start can be indented one extra level later.
        void record_line_continuations_until(size_t offset) {
            wcstring gap_text = src.substr(last_leaf_end, offset - last_leaf_end);
            size_t escaped_nl = gap_text.find(L"\\\n");
            if (escaped_nl == wcstring::npos) return;
            auto line_end = gap_text.begin() + escaped_nl;
            // Do nothing if a '#' precedes the escaped newline within the gap.
            if (std::find(gap_text.begin(), line_end, L'#') != line_end) return;
            auto end = src.begin() + offset;
            auto newline = src.begin() + last_leaf_end + escaped_nl + 1;
            // The gap text might contain multiple newlines if there are multiple lines that
            // don't contain an AST node, for example, comment lines, or lines containing only
            // the escaped newline.
            do {
                line_continuations.push_back(newline - src.begin());
                newline = std::find(newline + 1, end, L'\n');
            } while (newline != end);
        }

        // The one-past-the-last index of the most recently encountered leaf node.
        // We use this to populate the indents even if there's no tokens in the range.
        size_t last_leaf_end{0};

        // The last indent which we assigned.
        int last_indent{-1};

        // The source we are indenting.
        const wcstring &src;

        // List of indents, which we populate.
        std::vector<int> &indents;

        // Initialize our starting indent to -1, as our top-level node is a job list which
        // will immediately increment it.
        int indent{-1};

        // List of locations of escaped newline characters.
        std::vector<size_t> line_continuations;
    };

    indent_visitor_t iv(src, indents);
    node_visitor(iv).accept(ast.top());
    // Handle the text after the last leaf the same way as the gaps between leaves.
    iv.record_line_continuations_until(indents.size());
    std::fill(indents.begin() + iv.last_leaf_end, indents.end(), iv.last_indent);

    // All newlines now get the *next* indent.
    // For example, in this code:
    //    if true
    //       stuff
    // the newline "belongs" to the if statement as it ends its job.
    // But when rendered, it visually belongs to the job list.

    // Walk backwards so that next_indent always holds the indent of the nearest following
    // non-newline character.
    size_t idx = src_size;
    int next_indent = iv.last_indent;
    while (idx--) {
        if (src.at(idx) == L'\n') {
            // A newline directly followed by another newline keeps its own indent.
            bool empty_middle_line = idx + 1 < src_size && src.at(idx + 1) == L'\n';
            if (!empty_middle_line) {
                indents.at(idx) = next_indent;
            }
        } else {
            next_indent = indents.at(idx);
        }
    }
    // Add an extra level of indentation to continuation lines.
    for (size_t idx : iv.line_continuations) {
        do {
            indents.at(idx)++;
        } while (++idx < src_size && src.at(idx) != L'\n');
    }

    return indents;
}

/// Format a syntax error message and append it to \p errors.
///
/// \param errors the list to append to; if null, nothing is formatted or recorded.
/// \param source_location the source offset stored as the error's start. The recorded length
/// is 0.
/// \param fmt a format string, followed by its arguments.
/// \return always true.
static bool append_syntax_error(parse_error_list_t *errors, size_t source_location,
                                const wchar_t *fmt, ...) {
    if (errors != nullptr) {
        va_list args;
        va_start(args, fmt);
        auto message = vformat_string(fmt, args);
        va_end(args);

        parse_error_t err;
        err.source_start = source_location;
        err.source_length = 0;
        err.code = parse_error_syntax;
        err.text = std::move(message);
        errors->push_back(std::move(err));
    }
    return true;
}

/// Names of the builtins that may not be used in a pipeline.
static const wchar_t *const forbidden_pipe_commands[] = {L"exec", L"case", L"break", L"return",
                                                         L"continue"};

/// \return 1 if \p word is a builtin that may not be used in a pipeline, 0 otherwise.
static int parser_is_pipe_forbidden(const wcstring &word) {
    const bool is_forbidden = contains(forbidden_pipe_commands, word);
    return is_forbidden ? 1 : 0;
}

/// \return whether the NUL-terminated argument \p s is exactly "-h" or "--help".
bool parse_util_argument_is_help(const wchar_t *s) {
    static const wchar_t *const help_flags[] = {L"-h", L"--help"};
    for (const wchar_t *flag : help_flags) {
        if (std::wcscmp(flag, s) == 0) {
            return true;
        }
    }
    return false;
}

// Scan \p list in order for its first argument entry, skipping every entry that is not an
// argument.
// \return a pointer to that argument node, or nullptr if the list holds no arguments.
static const ast::argument_t *get_first_arg(const ast::argument_or_redirection_list_t &list) {
    const ast::argument_t *first_arg = nullptr;
    for (const ast::argument_or_redirection_t &item : list) {
        if (!item.is_argument()) continue;
        first_arg = &item.argument();
        break;
    }
    return first_arg;
}

/// Choose the error message for an invalid variable name, based on the character that
/// immediately follows the dollar sign. For example, if \p wc is @, then the variable name was
/// $@ and we suggest $argv.
///
/// \param wc the character after the dollar sign.
/// \return the matching error format; ERROR_BAD_VAR_CHAR1 if no more specific message applies.
static const wchar_t *error_format_for_character(wchar_t wc) {
    const wchar_t *format = nullptr;
    switch (wc) {
        case L'?':
            format = ERROR_NOT_STATUS;
            break;
        case L'#':
            format = ERROR_NOT_ARGV_COUNT;
            break;
        case L'@':
            format = ERROR_NOT_ARGV_AT;
            break;
        case L'*':
            format = ERROR_NOT_ARGV_STAR;
            break;
        // A second dollar sign, whether literal or already converted to an expansion marker.
        case L'$':
        case VARIABLE_EXPAND:
        case VARIABLE_EXPAND_SINGLE:
        case VARIABLE_EXPAND_EMPTY:
            format = ERROR_NOT_PID;
            break;
        default:
            format = ERROR_BAD_VAR_CHAR1;
            break;
    }
    return format;
}

void parse_util_expand_variable_error(const wcstring &token, size_t global_token_pos,
                                      size_t dollar_pos, parse_error_list_t *errors) {
    // Note that dollar_pos is probably VARIABLE_EXPAND or VARIABLE_EXPAND_SINGLE, not a literal
    // dollar sign.
    assert(errors != nullptr);
    assert(dollar_pos < token.size());
    const bool double_quotes = token.at(dollar_pos) == VARIABLE_EXPAND_SINGLE;
    const size_t start_error_count = errors->size();
    const size_t global_dollar_pos = global_token_pos + dollar_pos;
    const size_t global_after_dollar_pos = global_dollar_pos + 1;
    wchar_t char_after_dollar = dollar_pos + 1 >= token.size() ? 0 : token.at(dollar_pos + 1);

    switch (char_after_dollar) {
        case BRACE_BEGIN:
        case L'{': {
            // The BRACE_BEGIN is for unquoted, the { is for quoted. Anyways we have (possible
            // quoted) ${. See if we have a }, and the stuff in between is variable material. If so,
            // report a bracket error. Otherwise just complain about the ${.
            bool looks_like_variable = false;
            size_t closing_bracket =
                token.find(char_after_dollar == L'{' ? L'}' : wchar_t(BRACE_END), dollar_pos + 2);
            wcstring var_name;
            if (closing_bracket != wcstring::npos) {
                size_t var_start = dollar_pos + 2, var_end = closing_bracket;
                var_name = wcstring(token, var_start, var_end - var_start);
                looks_like_variable = valid_var_name(var_name);
            }
            if (looks_like_variable) {
                append_syntax_error(
                    errors, global_after_dollar_pos,
                    double_quotes ? ERROR_BRACKETED_VARIABLE_QUOTED1 : ERROR_BRACKETED_VARIABLE1,
                    truncate(var_name, var_err_len).c_str());
            } else {
                append_syntax_error(errors, global_after_dollar_pos, ERROR_BAD_VAR_CHAR1, L'{');
            }
            break;
        }
        case INTERNAL_SEPARATOR: {
            // e.g.: echo foo"$"baz
            // These are only ever quotes, not command substitutions. Command substitutions are
            // handled earlier.
            append_syntax_error(errors, global_dollar_pos, ERROR_NO_VAR_NAME);
            break;
        }
        case '(': {
            // e.g.: 'echo "foo$(bar)baz"
            // Try to determine what's in the parens.
            wcstring token_after_parens;
            wcstring paren_text;
            size_t open_parens = dollar_pos + 1, cmdsub_start = 0, cmdsub_end = 0;
            if (parse_util_locate_cmdsubst_range(token, &open_parens, &paren_text, &cmdsub_start,
                                                 &cmdsub_end, true) > 0) {
                token_after_parens = tok_first(paren_text);
            }

            // Make sure we always show something.
            if (token_after_parens.empty()) {
                token_after_parens = get_ellipsis_str();
            }

            append_syntax_error(errors, global_dollar_pos, ERROR_BAD_VAR_SUBCOMMAND1,
                                truncate(token_after_parens, var_err_len).c_str());
            break;
        }
        case L'\0': {
            append_syntax_error(errors, global_dollar_pos, ERROR_NO_VAR_NAME);
            break;
        }
        default: {
            wchar_t token_stop_char = char_after_dollar;
            // Unescape (see issue #50).
            if (token_stop_char == ANY_CHAR)
                token_stop_char = L'?';
            else if (token_stop_char == ANY_STRING || token_stop_char == ANY_STRING_RECURSIVE)
                token_stop_char = L'*';

            // Determine which error message to use. The format string may not consume all the
            // arguments we pass but that's harmless.
            const wchar_t *error_fmt = error_format_for_character(token_stop_char);

            append_syntax_error(errors, global_after_dollar_pos, error_fmt, token_stop_char);
            break;
        }
    }

    // We should have appended exactly one error.
    assert(errors->size() == start_error_count + 1);
}

/// Detect cases like $(abc). Given an arg like foo(bar), \p arg_src is foo and \p cmdsubst_src is
/// bar. If the unescaped \p arg_src ends with VARIABLE_EXPAND, PARSER_TEST_ERROR is returned and,
/// when \p out_errors is non-null, an error located at the last character of \p arg_src (offset by
/// \p arg_src_offset) is appended. Otherwise 0 is returned.
static parser_test_error_bits_t detect_dollar_cmdsub_errors(size_t arg_src_offset,
                                                            const wcstring &arg_src,
                                                            const wcstring &cmdsubst_src,
                                                            parse_error_list_t *out_errors) {
    wcstring unescaped;
    const bool unescaped_ok = unescape_string(arg_src, &unescaped, UNESCAPE_SPECIAL);
    if (!unescaped_ok || unescaped.empty()) return 0;

    // Only a trailing variable-expansion marker is of interest.
    if (unescaped.back() != VARIABLE_EXPAND) return 0;

    if (out_errors != nullptr) {
        wcstring first_token = tok_first(cmdsubst_src);
        if (first_token.empty()) {
            // e.g. $(). Report something.
            first_token = get_ellipsis_str();
        }
        // Global position of the dollar.
        const size_t dollar_offset = arg_src_offset + arg_src.size() - 1;
        append_syntax_error(out_errors, dollar_offset, ERROR_BAD_VAR_SUBCOMMAND1,
                            truncate(first_token, var_err_len).c_str());
    }
    return PARSER_TEST_ERROR;
}

/// Test if this argument contains any errors. Detected errors include syntax errors in command
/// substitutions, improperly escaped characters and improper use of the variable expansion
/// operator.
///
/// \param arg the argument node. If it has no source range, nothing is checked and 0 is returned.
/// \param arg_src the source text of the argument.
/// \param out_errors if non-null, receives the detected errors. Positions are offset by the start
/// of the argument's source range.
/// \return the accumulated error bits; 0 if no error was detected.
parser_test_error_bits_t parse_util_detect_errors_in_argument(const ast::argument_t &arg,
                                                              const wcstring &arg_src,
                                                              parse_error_list_t *out_errors) {
    maybe_t<source_range_t> source_range = arg.try_source_range();
    if (!source_range.has_value()) return 0;

    size_t source_start = source_range->start;
    parser_test_error_bits_t err = 0;

    // State shared across calls to the command substitution locator. cursor is passed by pointer,
    // presumably so that each call resumes after the previously located substitution.
    size_t cursor = 0;
    wcstring subst;

    // Phase 1: validate the contents of every command substitution in the argument.
    bool do_loop = true;
    while (do_loop) {
        size_t paren_begin = 0;
        size_t paren_end = 0;
        switch (parse_util_locate_cmdsubst_range(arg_src, &cursor, &subst, &paren_begin, &paren_end,
                                                 false)) {
            case -1: {
                // The locator failed; this is reported as mismatched parentheses and ends all
                // further checking of this argument.
                err |= PARSER_TEST_ERROR;
                if (out_errors) {
                    append_syntax_error(out_errors, source_start, L"Mismatched parenthesis");
                }
                return err;
            }
            case 0: {
                // Nothing (more) was located; leave the loop and continue with phase 2.
                do_loop = false;
                break;
            }
            case 1: {
                // A command substitution was located; its text is in subst. Check it recursively
                // as a standalone piece of source.
                assert(paren_begin < paren_end && "Parens out of order?");
                parse_error_list_t subst_errors;
                err |= parse_util_detect_errors(subst, &subst_errors);

                // Our command substitution produced error offsets relative to its source. Tweak the
                // offsets of the errors in the command substitution to account for both its offset
                // within the string, and the offset of the node.
                size_t error_offset = paren_begin + 1 + source_start;
                parse_error_offset_source_start(&subst_errors, error_offset);

                if (out_errors != nullptr) {
                    out_errors->insert(out_errors->end(), subst_errors.begin(), subst_errors.end());

                    // Hackish. Take this opportunity to report $(...) errors. We do this because
                    // after we've replaced with internal separators, we can't distinguish between
                    // "" and (), and also we no longer have the source of the command substitution.
                    // As an optimization, this is only necessary if the last character is a $.
                    // Note that this check only runs when the caller supplied an error list.
                    if (paren_begin > 0 && arg_src.at(paren_begin - 1) == L'$') {
                        err |= detect_dollar_cmdsub_errors(
                            source_start, arg_src.substr(0, paren_begin), subst, out_errors);
                    }
                }
                break;
            }
            default: {
                DIE("unexpected parse_util_locate_cmdsubst() return value");
            }
        }
    }

    // Phase 2: the argument must be unescapable as a whole.
    wcstring unesc;
    if (!unescape_string(arg_src, &unesc, UNESCAPE_SPECIAL)) {
        if (out_errors) {
            append_syntax_error(out_errors, source_start, L"Invalid token '%ls'", arg_src.c_str());
        }
        // NOTE(review): the literal 1 here (and in `err = 1` below) is presumably meant to be
        // PARSER_TEST_ERROR, and it discards any bits accumulated in err so far - confirm.
        return 1;
    }

    // Check for invalid variable expansions.
    // Phase 3: every variable-expansion marker in the unescaped text must be followed by another
    // marker or by a character that is valid in a variable name.
    const size_t unesc_size = unesc.size();
    for (size_t idx = 0; idx < unesc_size; idx++) {
        if (unesc.at(idx) != VARIABLE_EXPAND && unesc.at(idx) != VARIABLE_EXPAND_SINGLE) {
            continue;
        }

        // A marker at the very end of the text is treated as being followed by NUL.
        wchar_t next_char = idx + 1 < unesc_size ? unesc.at(idx + 1) : L'\0';
        if (next_char != VARIABLE_EXPAND && next_char != VARIABLE_EXPAND_SINGLE &&
            !valid_var_name_char(next_char)) {
            err = 1;
            if (out_errors) {
                // We have something like $$$^....  Back up until we reach the first $.
                size_t first_dollar = idx;
                while (first_dollar > 0 && (unesc.at(first_dollar - 1) == VARIABLE_EXPAND ||
                                            unesc.at(first_dollar - 1) == VARIABLE_EXPAND_SINGLE)) {
                    first_dollar--;
                }
                parse_util_expand_variable_error(unesc, source_start, first_dollar, out_errors);
            }
        }
    }

    return err;
}

/// Given that \p job should be backgrounded, return true if we detect any errors, appending a
/// description to \p parse_errors.
///
/// Backgrounding is disallowed in the following cases:
///   foo & ; and bar
///   foo & ; or bar
///   if foo & ; end
///   while foo & ; end
static bool detect_errors_in_backgrounded_job(const ast::job_t &job,
                                              parse_error_list_t *parse_errors) {
    using namespace ast;
    const auto job_range = job.try_source_range();
    if (!job_range) return false;

    // Only jobs that sit directly inside a job conjunction are examined.
    const job_conjunction_t *job_conj = job.parent->try_as<job_conjunction_t>();
    if (!job_conj) return false;

    // A backgrounded job used as the condition of an 'if' or a 'while'.
    const auto *container = job_conj->parent;
    if (container->try_as<if_clause_t>() || container->try_as<while_header_t>()) {
        return append_syntax_error(parse_errors, job_range->start,
                                   BACKGROUND_IN_CONDITIONAL_ERROR_MSG);
    }

    // Otherwise we only care about conjunctions that live in a job list.
    const ast::job_list_t *jlist = container->try_as<ast::job_list_t>();
    if (!jlist) return false;

    // This isn't very complete, e.g. we don't catch 'foo & ; not and bar'.
    // Locate our own conjunction within the list.
    size_t index = 0;
    while (index < jlist->count() && jlist->at(index) != job_conj) {
        index++;
    }
    assert(index < jlist->count() && "Should have found the job in the list");

    // Look at the conjunction that follows us, if any, and at its decorator, if any.
    const job_conjunction_t *next = jlist->at(index + 1);
    if (!next) return false;

    const keyword_base_t *deco = next->decorator.contents.get();
    if (!deco) return false;

    assert((deco->kw == parse_keyword_t::kw_and || deco->kw == parse_keyword_t::kw_or) &&
           "Unexpected decorator keyword");
    const wchar_t *deco_name = (deco->kw == parse_keyword_t::kw_and ? L"and" : L"or");
    return append_syntax_error(parse_errors, deco->source_range().start,
                               BOOL_AFTER_BACKGROUND_ERROR_MSG, deco_name);
}

/// Given a source buffer \p buff_src and decorated statement \p dst within it, return true if there
/// is an error and false if not. \p storage may be used to reduce allocations.
///
/// The checks performed, in order, are: 'exec' inside a pipeline; 'and'/'or' as a non-first
/// command of a pipeline; failure to expand the command; a pipe-forbidden command inside a
/// pipeline; 'return' outside of a function; 'break'/'continue' outside of a loop; and an unknown
/// name following the 'builtin' decoration. The checks that follow the command expansion are
/// skipped once an error has been recorded.
///
/// \param parse_errors the list passed to append_syntax_error and to the expansion helpers to
/// collect error descriptions.
static bool detect_errors_in_decorated_statement(const wcstring &buff_src,
                                                 const ast::decorated_statement_t &dst,
                                                 wcstring *storage,
                                                 parse_error_list_t *parse_errors) {
    using namespace ast;
    bool errored = false;
    // All errors appended directly by this function are located at the start of the statement.
    auto source_start = dst.source_range().start;
    const statement_decoration_t decoration = dst.decoration();

    // Determine if the first argument is help.
    // This is used below to exempt 'return --help', 'break --help' and 'continue --help'.
    bool first_arg_is_help = false;
    if (const auto *arg = get_first_arg(dst.args_or_redirs)) {
        const wcstring &arg_src = arg->source(buff_src, storage);
        first_arg_is_help = parse_util_argument_is_help(arg_src.c_str());
    }

    // Get the statement we are part of.
    const statement_t *st = dst.parent->as<statement_t>();

    // Walk up to the job.
    // The loop ends as soon as an ancestor is a job; running off the root trips the assert.
    const ast::job_t *job = nullptr;
    for (const node_t *cursor = st; job == nullptr; cursor = cursor->parent) {
        assert(cursor && "Reached root without finding a job");
        job = cursor->try_as<ast::job_t>();
    }
    assert(job && "Should have found the job");

    // Check our pipeline position.
    // A job with no continuation is not a pipeline at all; otherwise we are either the job's own
    // (first) statement or one of the later ones.
    pipeline_position_t pipe_pos;
    if (job->continuation.empty()) {
        pipe_pos = pipeline_position_t::none;
    } else if (&job->statement == st) {
        pipe_pos = pipeline_position_t::first;
    } else {
        pipe_pos = pipeline_position_t::subsequent;
    }

    // Check that we don't try to pipe through exec.
    bool is_in_pipeline = (pipe_pos != pipeline_position_t::none);
    if (is_in_pipeline && decoration == statement_decoration_t::exec) {
        errored = append_syntax_error(parse_errors, source_start, EXEC_ERR_MSG, L"exec");
    }

    // This is a somewhat stale check that 'and' and 'or' are not in pipelines, except at the
    // beginning. We can't disallow them as commands entirely because we need to support 'and
    // --help', etc.
    if (pipe_pos == pipeline_position_t::subsequent) {
        // check if our command is 'and' or 'or'. This is very clumsy; we don't catch e.g. quoted
        // commands.
        const wcstring &command = dst.command.source(buff_src, storage);
        if (command == L"and" || command == L"or") {
            errored =
                append_syntax_error(parse_errors, source_start, EXEC_ERR_MSG, command.c_str());
        }
    }

    // The remaining checks need the command text; they are skipped if it is empty.
    const wcstring &unexp_command = dst.command.source(buff_src, storage);
    if (!unexp_command.empty()) {
        wcstring command;
        // Check that we can expand the command.
        if (expand_to_command_and_args(unexp_command, operation_context_t::empty(), &command,
                                       nullptr, parse_errors,
                                       true /* skip wildcards */) == expand_result_t::error) {
            errored = true;
            // Shift the recorded error offsets by the start of this statement.
            parse_error_offset_source_start(parse_errors, source_start);
        }

        // Check that pipes are sound.
        if (!errored && parser_is_pipe_forbidden(command) && is_in_pipeline) {
            errored =
                append_syntax_error(parse_errors, source_start, EXEC_ERR_MSG, command.c_str());
        }

        // Check that we don't return from outside a function. But we allow it if it's
        // 'return --help'.
        if (!errored && command == L"return" && !first_arg_is_help) {
            // See if we are in a function.
            // Any enclosing block statement with a function header counts, however distant.
            bool found_function = false;
            for (const node_t *cursor = &dst; cursor != nullptr; cursor = cursor->parent) {
                if (const auto *bs = cursor->try_as<block_statement_t>()) {
                    if (bs->header->type == type_t::function_header) {
                        found_function = true;
                        break;
                    }
                }
            }

            if (!found_function) {
                errored = append_syntax_error(parse_errors, source_start, INVALID_RETURN_ERR_MSG);
            }
        }

        // Check that we don't break or continue from outside a loop.
        if (!errored && (command == L"break" || command == L"continue") && !first_arg_is_help) {
            // Walk up until we hit a 'for' or 'while' loop. If we hit a function first,
            // stop the search; we can't break an outer loop from inside a function.
            // This is a little funny because we can't tell if it's a 'for' or 'while'
            // loop from the ancestor alone; we need the header. That is, we hit a
            // block_statement, and have to check its header.
            bool found_loop = false;
            for (const node_t *ancestor = &dst; ancestor != nullptr; ancestor = ancestor->parent) {
                const auto *block = ancestor->try_as<block_statement_t>();
                if (!block) continue;
                if (block->header->type == type_t::for_header ||
                    block->header->type == type_t::while_header) {
                    // This is a loop header, so we can break or continue.
                    found_loop = true;
                    break;
                } else if (block->header->type == type_t::function_header) {
                    // This is a function header, so we cannot break or
                    // continue. We stop our search here.
                    found_loop = false;
                    break;
                }
            }

            if (!found_loop) {
                errored = append_syntax_error(
                    parse_errors, source_start,
                    (command == L"break" ? INVALID_BREAK_ERR_MSG : INVALID_CONTINUE_ERR_MSG));
            }
        }

        // Check that we don't do an invalid builtin (issue #1252).
        if (!errored && decoration == statement_decoration_t::builtin) {
            // NOTE(review): this local shadows the outer `command`, and its expanded value is
            // never read: builtin_exists() is called with the unexpanded text. Presumably the
            // expansion is only used as a "can this be expanded" test - confirm that is intended.
            wcstring command = unexp_command;
            if (expand_one(command, expand_flag::skip_cmdsubst, operation_context_t::empty(),
                           parse_errors) &&
                !builtin_exists(unexp_command)) {
                errored = append_syntax_error(parse_errors, source_start, UNKNOWN_BUILTIN_ERR_MSG,
                                              unexp_command.c_str());
            }
        }
    }
    return errored;
}

// Given we have a trailing argument_or_redirection_list, like `begin; end > /dev/null`, verify that
// there are no arguments in the list.
//
// \param args_or_redirs the list that follows the block's 'end'.
// \param out_errors passed to append_syntax_error to receive the error description.
// \return true if the list contains an argument (an error located at the first such argument is
// appended), false if the list has no arguments.
static bool detect_errors_in_block_redirection_list(
    const ast::argument_or_redirection_list_t &args_or_redirs, parse_error_list_t *out_errors) {
    if (const auto *first_arg = get_first_arg(args_or_redirs)) {
        // An argument after 'end' must be reported with the dedicated "'end' does not take
        // arguments" message, not with the unrelated message about backgrounded conditionals.
        return append_syntax_error(out_errors, first_arg->source_range().start, END_ARG_ERR_MSG);
    }
    return false;
}

/// Walk every node of \p ast, which was parsed from \p buff_src, and check it for errors that the
/// parser itself does not report. Error descriptions are passed on to \p out_errors.
/// \return a combination of PARSER_TEST_ERROR (some check failed) and PARSER_TEST_INCOMPLETE (the
/// source has an unclosed block, a pipe with no statement after it, or a && / || with no job after
/// it), or 0 if neither applies.
parser_test_error_bits_t parse_util_detect_errors(const ast::ast_t &ast, const wcstring &buff_src,
                                                  parse_error_list_t *out_errors) {
    using namespace ast;

    // Bits contributed directly by the per-argument checks.
    parser_test_error_bits_t res = 0;

    // Set when any of the structural checks below reports an error.
    bool errored = false;

    // Set when the source looks unfinished. There are three ways to get here:
    //  - an unclosed block, detected via an 'end' that has no source;
    //  - a missing statement, i.e. a newline after a pipe, detected via a job continuation whose
    //    pipe has source but whose statement does not;
    //  - a missing job, i.e. a newline after && or ||, detected via a conjunction continuation
    //    whose operator has source but whose job does not.
    bool incomplete = false;

    // Scratch buffer that the source() calls may use.
    wcstring storage;

    // Shared handling for the three kinds of 'end'-terminated statements: note a missing 'end',
    // and reject arguments in the list that trails it.
    auto check_block_tail = [&](bool end_unsourced,
                                const ast::argument_or_redirection_list_t &tail) {
        if (end_unsourced) incomplete = true;
        if (detect_errors_in_block_redirection_list(tail, out_errors)) errored = true;
    };

    // What gets verified while walking:
    //  - all commands can be expanded;
    //  - 'or' and 'and' are not used inside pipelines;
    //  - pipes are allowed, via parser_is_pipe_forbidden;
    //  - 'return' appears only within a function;
    //  - arguments contain no invalid variable expansions.
    for (const node_t &node : ast) {
        if (const auto *jc = node.try_as<job_continuation_t>()) {
            // Somewhat clumsy: a pipe with source whose statement has none means the pipeline
            // was left dangling.
            const bool pipe_has_source = !jc->pipe.unsourced;
            if (pipe_has_source && !jc->statement.try_source_range().has_value()) {
                incomplete = true;
            }
        } else if (const auto *jcc = node.try_as<job_conjunction_continuation_t>()) {
            // Likewise for a && or || with source whose job has none.
            const bool conjunction_has_source = !jcc->conjunction.unsourced;
            if (conjunction_has_source && !jcc->job.try_source_range().has_value()) {
                incomplete = true;
            }
        } else if (const auto *arg = node.try_as<argument_t>()) {
            const wcstring &arg_src = arg->source(buff_src, &storage);
            res |= parse_util_detect_errors_in_argument(*arg, arg_src, out_errors);
        } else if (const auto *job = node.try_as<ast::job_t>()) {
            // Only backgrounded jobs need checking. Backgrounding is disallowed in:
            //
            // foo & ; and bar
            // foo & ; or bar
            // if foo & ; end
            // while foo & ; end
            if (job->bg && detect_errors_in_backgrounded_job(*job, out_errors)) {
                errored = true;
            }
        } else if (const auto *stmt = node.try_as<decorated_statement_t>()) {
            if (detect_errors_in_decorated_statement(buff_src, *stmt, &storage, out_errors)) {
                errored = true;
            }
        } else if (const auto *block = node.try_as<block_statement_t>()) {
            check_block_tail(block->end.unsourced, block->args_or_redirs);
        } else if (const auto *ifs = node.try_as<if_statement_t>()) {
            check_block_tail(ifs->end.unsourced, ifs->args_or_redirs);
        } else if (const auto *switchs = node.try_as<switch_statement_t>()) {
            check_block_tail(switchs->end.unsourced, switchs->args_or_redirs);
        }
    }

    if (errored) res |= PARSER_TEST_ERROR;
    if (incomplete) res |= PARSER_TEST_INCOMPLETE;
    return res;
}

/// Parse \p buff_src and check it for errors.
/// \param out_errors if non-null, receives the parse errors, or the errors found by the
/// tree-walking overload when parsing itself succeeded.
/// \param allow_incomplete if set, unterminated quotes and subshells are not treated as errors;
/// instead PARSER_TEST_INCOMPLETE is returned without validating anything else.
/// \return PARSER_TEST_INCOMPLETE or PARSER_TEST_ERROR as described, otherwise whatever the
/// tree-walking overload returns.
parser_test_error_bits_t parse_util_detect_errors(const wcstring &buff_src,
                                                  parse_error_list_t *out_errors,
                                                  bool allow_incomplete) {
    parse_tree_flags_t parse_flags = parse_flag_none;
    if (allow_incomplete) parse_flags = parse_flag_leave_unterminated;

    // Parse the input string into an ast. Some errors are detected here.
    using namespace ast;
    parse_error_list_t parse_errors;
    auto ast = ast_t::parse(buff_src, parse_flags, &parse_errors);

    // Whether there's an unclosed quote or subshell, and therefore unfinished. This can only
    // become true when allow_incomplete is set.
    bool has_unclosed_quote_or_subshell = false;
    if (allow_incomplete) {
        // Issue #1238: unterminated quotes and subshells are not real errors here, so drop them
        // from the list. Iterate from the back so that erasing does not disturb the indices
        // still to be visited.
        for (size_t idx = parse_errors.size(); idx-- > 0;) {
            const auto code = parse_errors.at(idx).code;
            const bool unterminated = code == parse_error_tokenizer_unterminated_quote ||
                                      code == parse_error_tokenizer_unterminated_subshell;
            if (!unterminated) continue;
            has_unclosed_quote_or_subshell = true;
            parse_errors.erase(parse_errors.begin() + idx);
        }
    }

    assert(!has_unclosed_quote_or_subshell || allow_incomplete);
    if (has_unclosed_quote_or_subshell) {
        // The rest of the tree is not validated in this case.
        return PARSER_TEST_INCOMPLETE;
    }

    // Any remaining parse error is final: hand the errors over and stop.
    if (!parse_errors.empty()) {
        if (out_errors) vec_append(*out_errors, std::move(parse_errors));
        return PARSER_TEST_ERROR;
    }

    // The source parsed cleanly; let the tree-walking overload do the rest.
    return parse_util_detect_errors(ast, buff_src, out_errors);
}

/// Parse \p arg_list_src as a freestanding argument list and check each of its arguments.
/// \return a description of the first error found, built with \p prefix, or none() if the list
/// parses and none of its arguments has an error.
maybe_t<wcstring> parse_util_detect_errors_in_argument_list(const wcstring &arg_list_src,
                                                            const wcstring &prefix) {
    using namespace ast;
    parse_error_list_t errors;

    // Describes the first collected error; only call this once an error has been recorded.
    auto describe_first_error = [&]() {
        assert(!errors.empty() && "Expected an error");
        return errors.at(0).describe_with_prefix(arg_list_src, prefix, false /* not interactive */,
                                                 false /* don't skip caret */);
    };

    // Errors from parsing the list itself take precedence.
    auto ast = ast_t::parse_argument_list(arg_list_src, parse_flag_none, &errors);
    if (!errors.empty()) {
        return describe_first_error();
    }

    // Check the arguments of the root list one by one, stopping at the first that has an error.
    const auto *arg_list = ast.top()->as<freestanding_argument_list_t>();
    for (const argument_t &arg : arg_list->arguments) {
        const wcstring arg_src = arg.source(arg_list_src);
        if (parse_util_detect_errors_in_argument(arg, arg_src, &errors)) {
            return describe_first_error();
        }
    }
    return none();
}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								// Various mostly unrelated utility functions related to parsing, loading and evaluating fish code.
 								//
 								// This library can be seen as a 'toolbox' for functions that are used in many places in fish and
 								// that are somehow related to parsing the code.
-												add (or restore) config.h to all files

The autoconf-generated config.h contains a number of directives which
may alter the behaviour of system headers on certain platforms. Always
include it in every C++ file as the first include.

Closes #2993.

											
										
										
											2016-05-19 06:30:21 +08:00
+								#include "config.h"  // IWYU pragma: keep
-												Run clang-format on all files

The main change here is to reorder headers.

											
										
										
											2019-10-14 06:50:48 +08:00
+								#include "parse_util.h"
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								#include <stdarg.h>
 								#include <stdlib.h>
-												lint cleanups

											
										
										
											2017-02-11 10:47:02 +08:00
-												Run clang-format on all files

The main change here is to reorder headers.

											
										
										
											2019-10-14 06:50:48 +08:00
+								#include <cwchar>
-												add better support for IWYU and fix things

Remove the "make iwyu" build target. Move the functionality into the
recently introduced lint.fish script. Fix a lot, but not all, of the
include-what-you-use errors. Specifically, it fixes all of the IWYU errors
on my OS X server but only removes some of them on my Ubuntu 14.04 server.

Fixes #2957

											
										
										
											2016-04-21 14:00:54 +08:00
+								#include <memory>
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								#include <string>
-												lint cleanups

											
										
										
											2017-02-11 10:47:02 +08:00
+								#include <type_traits>
-												Add support for calculating completions for arbitrary commands through the 'complete' builtin

darcs-hash:20060130165150-ac50b-5e2ef3bb0298dd5e1a5d6fbdade314cc73ef36f3.gz

											
										
										
											2006-01-31 00:51:50 +08:00
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
+								#include "ast.h"
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								#include "builtin.h"
-												Add support for calculating completions for arbitrary commands through the 'complete' builtin

darcs-hash:20060130165150-ac50b-5e2ef3bb0298dd5e1a5d6fbdade314cc73ef36f3.gz

											
										
										
											2006-01-31 00:51:50 +08:00
+								#include "common.h"
-												Autoloaded functions

darcs-hash:20060208092005-ac50b-8e784f79a4e158c8c15b553fad85002dccc7bd03.gz

											
										
										
											2006-02-08 17:20:05 +08:00
+								#include "expand.h"
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								#include "fallback.h"  // IWYU pragma: keep
-												Feature flag support for ? wildcard

This partially reverts 6e56637cf0a6036fdea4105e9f33314a3d6e8e78 and #4520
by bringing back the ? wildcard, guarded by the qmark-noglob feature flag.

											
										
										
											2018-05-06 10:11:57 +08:00
+								#include "future_feature_flags.h"
-												add better support for IWYU and fix things

Remove the "make iwyu" build target. Move the functionality into the
recently introduced lint.fish script. Fix a lot, but not all, of the
include-what-you-use errors. Specifically, it fixes all of the IWYU errors
on my OS X server but only removes some of them on my Ubuntu 14.04 server.

Fixes #2957

											
										
										
											2016-04-21 14:00:54 +08:00
+								#include "parse_constants.h"
-												Clean up some tokenization

Remove TOK_NONE
Turn token_type into an enum class
Make next() turn a maybe_t<tok_t> instead of a bool

											
										
										
											2019-10-14 07:06:16 +08:00
+								#include "parse_util.h"
-												Instantize env_get_pwd_slash

This requires threading environment_t through many places, such as completions
and history. We introduce null_environment_t for when the environment isn't
important.

											
										
										
											2018-09-11 13:29:52 +08:00
+								#include "parser.h"
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								#include "tokenizer.h"
-												parse_util.cpp: remove truncate_string()

We already have something that does this

											
										
										
											2019-09-20 01:32:07 +08:00
+								#include "wcstringutil.h"
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								#include "wildcard.h"
 								#include "wutil.h"  // IWYU pragma: keep
-												Autoloaded functions

darcs-hash:20060208092005-ac50b-8e784f79a4e158c8c15b553fad85002dccc7bd03.gz

											
										
										
											2006-02-08 17:20:05 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
/// Error message for use of backgrounded commands before and/or. The %ls placeholder is filled
/// with the name of the command that follows the backgrounded job.
#define BOOL_AFTER_BACKGROUND_ERROR_MSG \
    _(L"The '%ls' command can not be used immediately after a backgrounded job")
-												Disallow backgrounding in conditionals and before and/or bool statements

Fixes #1136

											
										
										
											2014-11-03 05:11:27 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
/// Error message for backgrounded commands as conditionals. Takes no format arguments.
#define BACKGROUND_IN_CONDITIONAL_ERROR_MSG \
    _(L"Backgrounded commands can not be used as conditionals")
-												Disallow backgrounding in conditionals and before and/or bool statements

Fixes #1136

											
										
										
											2014-11-03 05:11:27 +08:00
-												Report errors for arguments to 'end'

For example, `begin ; end arg` will now report an error.

Fixes #986

											
										
										
											2018-01-23 05:31:39 +08:00
/// Error message for arguments to 'end'. Takes no format arguments.
#define END_ARG_ERR_MSG _(L"'end' does not take arguments. Did you forget a ';'?")
-												parse_util.cpp: remove truncate_string()

We already have something that does this

											
										
										
											2019-09-20 01:32:07 +08:00
/// Maximum length of a variable name to show in error reports before truncation.
static constexpr int var_err_len = 16;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
/// Compute the 1-based line number of the character at \p offset in \p str.
///
/// \param str the NUL-terminated text to scan; may be null.
/// \param offset number of leading characters to examine. Scanning also stops at the terminating
///        NUL, so an offset past the end is treated as the end of the string.
/// \return 0 if \p str is null, otherwise 1 plus the number of newlines found before \p offset.
int parse_util_lineno(const wchar_t *str, size_t offset) {
    if (!str) return 0;

    int res = 1;
    for (size_t i = 0; i < offset && str[i] != L'\0'; i++) {
        if (str[i] == L'\n') {
            res++;
        }
    }
    return res;
}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								int parse_util_get_line_from_offset(const wcstring &str, size_t pos) {
-												Const correctness changes

											
										
										
											2012-02-06 16:57:43 +08:00
+								    const wchar_t *buff = str.c_str();
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								    int count = 0;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    for (size_t i = 0; i < pos; i++) {
 								        if (!buff[i]) {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								            return -1;
 								        }
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        if (buff[i] == L'\n') {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								            count++;
 								        }
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
+								    }
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								    return count;
-												Make up/down cursor move up or down when in multiline mode, except if already in search mode or at the top/bottom line. Since part of this is done in script-space, this involves adding some functionality to the commandline builtin.

darcs-hash:20070921140549-75c98-ba9e83f5e6fdecae5df8f83dd863794c6af9770c.gz

											
										
										
											2007-09-21 22:05:49 +08:00
+								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								size_t parse_util_get_offset_from_line(const wcstring &str, int line) {
-												Const correctness changes

											
										
										
											2012-02-06 16:57:43 +08:00
+								    const wchar_t *buff = str.c_str();
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								    size_t i;
 								    int count = 0;
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												[clang-tidy] Convert C casts to C++ ones

Found with google-readability-casting

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 09:08:16 +08:00
+								    if (line < 0) return static_cast<size_t>(-1);
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    if (line == 0) return 0;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    for (i = 0;; i++) {
-												[clang-tidy] Convert C casts to C++ ones

Found with google-readability-casting

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 09:08:16 +08:00
+								        if (!buff[i]) return static_cast<size_t>(-1);
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        if (buff[i] == L'\n') {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								            count++;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            if (count == line) {
-												Teach up-line to cross empty lines

The line offset of a trailing newline on the commandline was computed incorrectly.
As a result, up-arrow did not work for a commandline like the one inserted by:

	commandline -i echo '' ''

Note this and the previous commit in the changelog.

											
										
										
											2020-08-29 17:07:12 +08:00
+								                return i + 1;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								            }
 								        }
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
+								    }
-												Make up/down cursor move up or down when in multiline mode, except if already in search mode or at the top/bottom line. Since part of this is done in script-space, this involves adding some functionality to the commandline builtin.

darcs-hash:20070921140549-75c98-ba9e83f5e6fdecae5df8f83dd863794c6af9770c.gz

											
										
										
											2007-09-21 22:05:49 +08:00
+								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								size_t parse_util_get_offset(const wcstring &str, int line, long line_offset) {
-												parse_util: Remove some wcharisms

											
										
										
											2018-10-21 04:25:55 +08:00
+								    size_t off = parse_util_get_offset_from_line(str, line);
 								    size_t off2 = parse_util_get_offset_from_line(str, line + 1);
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												[clang-tidy] Convert C casts to C++ ones

Found with google-readability-casting

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 09:08:16 +08:00
+								    if (off == static_cast<size_t>(-1)) return static_cast<size_t>(-1);
 								    if (off2 == static_cast<size_t>(-1)) off2 = str.length() + 1;
-												lint cleanup: parameter reassignment

											
										
										
											2016-10-21 09:53:31 +08:00
+								    if (line_offset < 0) line_offset = 0;  //!OCLINT(parameter reassignment)
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												[clang-tidy] Convert C casts to C++ ones

Found with google-readability-casting

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 09:08:16 +08:00
+								    if (static_cast<size_t>(line_offset) >= off2 - off - 1) {
-												lint cleanup: parameter reassignment

											
										
										
											2016-10-21 09:53:31 +08:00
+								        line_offset = off2 - off - 1;  //!OCLINT(parameter reassignment)
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								    }
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												eliminate signed/unsigned comparison warnings

This partially addresses #3430.

											
										
										
											2016-10-10 05:36:08 +08:00
+								    return off + line_offset;
-												Make up/down cursor move up or down when in multiline mode, except if already in search mode or at the top/bottom line. Since part of this is done in script-space, this involves adding some functionality to the commandline builtin.

darcs-hash:20070921140549-75c98-ba9e83f5e6fdecae5df8f83dd863794c6af9770c.gz

											
										
										
											2007-09-21 22:05:49 +08:00
+								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								static int parse_util_locate_brackets_of_type(const wchar_t *in, wchar_t **begin, wchar_t **end,
 								                                              bool allow_incomplete, wchar_t open_type,
 								                                              wchar_t close_type) {
 								    // open_type is typically ( or [, and close type is the corresponding value.
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								    wchar_t *pos;
-												Handle backslashes properly in locate_brackets_of_type

This needs to be rewritten, I'm pretty sure we have like 6 of these
kinds of ad-hoc "is this quoted" things lying around.

But for now, at least don't just check if the *previous* character was
a backslash.

Fixes #7685.

											
										
										
											2021-02-06 05:00:31 +08:00
+								    bool escaped = false;
-												Use bools, we have the technology

											
										
										
											2020-09-24 23:21:49 +08:00
+								    bool syntax_error = false;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    int paran_count = 0;
-												Run restyle.sh to enforce style rules.

											
										
										
											2014-04-01 01:01:39 +08:00
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								    wchar_t *paran_begin = nullptr, *paran_end = nullptr;
-												Run restyle.sh to enforce style rules.

											
										
										
											2014-04-01 01:01:39 +08:00
-												Eliminate the CHECK() macro

This thing was pretty useless.

											
										
										
											2019-05-28 08:24:19 +08:00
+								    assert(in && "null parameter");
-												Run restyle.sh to enforce style rules.

											
										
										
											2014-04-01 01:01:39 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    for (pos = const_cast<wchar_t *>(in); *pos; pos++) {
-												Handle backslashes properly in locate_brackets_of_type

This needs to be rewritten, I'm pretty sure we have like 6 of these
kinds of ad-hoc "is this quoted" things lying around.

But for now, at least don't just check if the *previous* character was
a backslash.

Fixes #7685.

											
										
										
											2021-02-06 05:00:31 +08:00
+								        if (!escaped) {
-												This commit changes wchar.h includes to cwchar, and uses std::
for everything it provides.

											
										
										
											2019-03-13 05:06:01 +08:00
+								            if (std::wcschr(L"\'\"", *pos)) {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								                wchar_t *q_end = quote_end(pos);
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								                if (q_end && *q_end) {
 								                    pos = q_end;
 								                } else {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								                    break;
 								                }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            } else {
 								                if (*pos == open_type) {
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								                    if ((paran_count == 0) && (paran_begin == nullptr)) {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								                        paran_begin = pos;
 								                    }
-												Run restyle.sh to enforce style rules.

											
										
										
											2014-04-01 01:01:39 +08:00
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								                    paran_count++;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								                } else if (*pos == close_type) {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								                    paran_count--;
-												Run restyle.sh to enforce style rules.

											
										
										
											2014-04-01 01:01:39 +08:00
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								                    if ((paran_count == 0) && (paran_end == nullptr)) {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								                        paran_end = pos;
 								                        break;
 								                    }
-												Run restyle.sh to enforce style rules.

											
										
										
											2014-04-01 01:01:39 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								                    if (paran_count < 0) {
-												Use bools, we have the technology

											
										
										
											2020-09-24 23:21:49 +08:00
+								                        syntax_error = true;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								                        break;
 								                    }
 								                }
 								            }
 								        }
-												Handle backslashes properly in locate_brackets_of_type

This needs to be rewritten, I'm pretty sure we have like 6 of these
kinds of ad-hoc "is this quoted" things lying around.

But for now, at least don't just check if the *previous* character was
a backslash.

Fixes #7685.

											
										
										
											2021-02-06 05:00:31 +08:00
+								        if (*pos == '\\') {
 								            escaped = !escaped;
 								        } else {
 								            escaped = false;
 								        }
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
+								    }
-												Run restyle.sh to enforce style rules.

											
										
										
											2014-04-01 01:01:39 +08:00
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								    syntax_error |= (paran_count < 0);
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    syntax_error |= ((paran_count > 0) && (!allow_incomplete));
-												Run restyle.sh to enforce style rules.

											
										
										
											2014-04-01 01:01:39 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    if (syntax_error) {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								        return -1;
 								    }
-												Run restyle.sh to enforce style rules.

											
										
										
											2014-04-01 01:01:39 +08:00
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								    if (paran_begin == nullptr) {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								        return 0;
 								    }
-												Run restyle.sh to enforce style rules.

											
										
										
											2014-04-01 01:01:39 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    if (begin) {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								        *begin = paran_begin;
 								    }
-												Run restyle.sh to enforce style rules.

											
										
										
											2014-04-01 01:01:39 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    if (end) {
-												[clang-tidy] Convert C casts to C++ ones

Found with google-readability-casting

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 09:08:16 +08:00
+								        *end = paran_count ? const_cast<wchar_t *>(in) + std::wcslen(in) : paran_end;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								    }
-												Run restyle.sh to enforce style rules.

											
										
										
											2014-04-01 01:01:39 +08:00
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								    return 1;
-												Add support for calculating completions for arbitrary commands through the 'complete' builtin

darcs-hash:20060130165150-ac50b-5e2ef3bb0298dd5e1a5d6fbdade314cc73ef36f3.gz

											
										
										
											2006-01-31 00:51:50 +08:00
+								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								int parse_util_locate_cmdsubst(const wchar_t *in, wchar_t **begin, wchar_t **end,
 								                               bool accept_incomplete) {
-												Highlight the entire variable name, not just the dollar sign. Fixes #1201

											
										
										
											2014-02-04 06:13:42 +08:00
+								    return parse_util_locate_brackets_of_type(in, begin, end, accept_incomplete, L'(', L')');
 								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								int parse_util_locate_slice(const wchar_t *in, wchar_t **begin, wchar_t **end,
 								                            bool accept_incomplete) {
-												Highlight the entire variable name, not just the dollar sign. Fixes #1201

											
										
										
											2014-02-04 06:13:42 +08:00
+								    return parse_util_locate_brackets_of_type(in, begin, end, accept_incomplete, L'[', L']');
 								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								static int parse_util_locate_brackets_range(const wcstring &str, size_t *inout_cursor_offset,
 								                                            wcstring *out_contents, size_t *out_start,
 								                                            size_t *out_end, bool accept_incomplete,
 								                                            wchar_t open_type, wchar_t close_type) {
 								    // Clear the return values.
-												fix incorrectly aligned carat in command expansion errors and more

- fix the carat position expanding e.g. `command $,`
- improve the error reporting for not-allowed command subtitutions
  by figuring out where the expansion failed instead of using
  SOURCE_LOCATION_UNKNOWN
- allow nullptr for parse_util_licate_brackets_range() out_string
  argument if we don't need it to do any work.

Fixes #5812

											
										
										
											2019-04-12 05:28:27 +08:00
+								    if (out_contents != nullptr) out_contents->clear();
-												Syntax highlighting for command substitutions

											
										
										
											2013-10-09 09:41:35 +08:00
+								    *out_start = 0;
 								    *out_end = str.size();
-												Update style and formatting to conform to fish style guide.

											
										
										
											2014-01-15 17:40:40 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    // Nothing to do if the offset is at or past the end of the string.
 								    if (*inout_cursor_offset >= str.size()) return 0;
-												Update style and formatting to conform to fish style guide.

											
										
										
											2014-01-15 17:40:40 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    // Defer to the wonky version.
 								    const wchar_t *const buff = str.c_str();
 								    const wchar_t *const valid_range_start = buff + *inout_cursor_offset,
 								                         *valid_range_end = buff + str.size();
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								    wchar_t *bracket_range_begin = nullptr, *bracket_range_end = nullptr;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    int ret = parse_util_locate_brackets_of_type(valid_range_start, &bracket_range_begin,
 								                                                 &bracket_range_end, accept_incomplete, open_type,
 								                                                 close_type);
-												lint: Use early exit/continue

											
										
										
											2016-10-31 12:05:27 +08:00
+								    if (ret <= 0) {
 								        return ret;
-												Syntax highlighting for command substitutions

											
										
										
											2013-10-09 09:41:35 +08:00
+								    }
-												lint: Use early exit/continue

											
										
										
											2016-10-31 12:05:27 +08:00
 								    // The command substitutions must not be NULL and must be in the valid pointer range, and
 								    // the end must be bigger than the beginning.
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								    assert(bracket_range_begin != nullptr && bracket_range_begin >= valid_range_start &&
-												time for another `make style-all`

											
										
										
											2016-12-04 12:12:53 +08:00
+								           bracket_range_begin <= valid_range_end);
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								    assert(bracket_range_end != nullptr && bracket_range_end > bracket_range_begin &&
-												time for another `make style-all`

											
										
										
											2016-12-04 12:12:53 +08:00
+								           bracket_range_end >= valid_range_start && bracket_range_end <= valid_range_end);
-												lint: Use early exit/continue

											
										
										
											2016-10-31 12:05:27 +08:00
 								    // Assign the substring to the out_contents.
 								    const wchar_t *interior_begin = bracket_range_begin + 1;
-												fix incorrectly aligned caret in command expansion errors and more

- fix the caret position expanding e.g. `command $,`
- improve the error reporting for not-allowed command substitutions
  by figuring out where the expansion failed instead of using
  SOURCE_LOCATION_UNKNOWN
- allow nullptr for parse_util_locate_brackets_range() out_string
  argument if we don't need it to do any work.

Fixes #5812

											
										
										
											2019-04-12 05:28:27 +08:00
+								    if (out_contents != nullptr) {
 								        out_contents->assign(interior_begin, bracket_range_end - interior_begin);
 								    }
-												lint: Use early exit/continue

											
										
										
											2016-10-31 12:05:27 +08:00
 								    // Return the start and end.
 								    *out_start = bracket_range_begin - buff;
 								    *out_end = bracket_range_end - buff;
 								    // Update the inout_cursor_offset. Note this may cause it to exceed str.size(), though
 								    // overflow is not likely.
 								    *inout_cursor_offset = 1 + *out_end;
-												Syntax highlighting for command substitutions

											
										
										
											2013-10-09 09:41:35 +08:00
+								    return ret;
 								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								int parse_util_locate_cmdsubst_range(const wcstring &str, size_t *inout_cursor_offset,
 								                                     wcstring *out_contents, size_t *out_start, size_t *out_end,
 								                                     bool accept_incomplete) {
 								    return parse_util_locate_brackets_range(str, inout_cursor_offset, out_contents, out_start,
 								                                            out_end, accept_incomplete, L'(', L')');
-												Highlight the entire variable name, not just the dollar sign. Fixes #1201

											
										
										
											2014-02-04 06:13:42 +08:00
+								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								void parse_util_cmdsubst_extent(const wchar_t *buff, size_t cursor_pos, const wchar_t **a,
 								                                const wchar_t **b) {
-												Eliminate the CHECK() macro

This thing was pretty useless.

											
										
										
											2019-05-28 08:24:19 +08:00
+								    assert(buff && "Null buffer");
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    const wchar_t *const cursor = buff + cursor_pos;
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												This commit changes wchar.h includes to cwchar, and uses std::
for everything it provides.

											
										
										
											2019-03-13 05:06:01 +08:00
+								    const size_t bufflen = std::wcslen(buff);
-												Make parse_util_locate_cmdsubst return the innermost command substitution instead of the outermost.
Fixes https://github.com/fish-shell/fish-shell/issues/913

											
										
										
											2013-07-17 16:35:30 +08:00
+								    assert(cursor_pos <= bufflen);
-												Improvements to new parser. All functions and completions now parse.

											
										
										
											2013-07-23 09:26:15 +08:00
-												Amend typos and grammar errors

											
										
										
											2019-11-25 19:03:25 +08:00
+								    // ap and bp are the beginning and end of the tightest command substitution found so far.
-												Make parse_util_locate_cmdsubst return the innermost command substitution instead of the outermost.
Fixes https://github.com/fish-shell/fish-shell/issues/913

											
										
										
											2013-07-17 16:35:30 +08:00
+								    const wchar_t *ap = buff, *bp = buff + bufflen;
 								    const wchar_t *pos = buff;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    for (;;) {
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								        wchar_t *begin = nullptr, *end = nullptr;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        if (parse_util_locate_cmdsubst(pos, &begin, &end, true) <= 0) {
 								            // No subshell found, all done.
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								            break;
 								        }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        // Interpret NULL to mean the end.
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								        if (end == nullptr) {
-												Make parse_util_locate_cmdsubst return the innermost command substitution instead of the outermost.
Fixes https://github.com/fish-shell/fish-shell/issues/913

											
										
										
											2013-07-17 16:35:30 +08:00
+								            end = const_cast<wchar_t *>(buff) + bufflen;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								        }
-												Improvements to new parser. All functions and completions now parse.

											
										
										
											2013-07-23 09:26:15 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        if (begin < cursor && end >= cursor) {
 								            // This command substitution surrounds the cursor, so it's a tighter fit.
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								            begin++;
-												Make parse_util_locate_cmdsubst return the innermost command substitution instead of the outermost.
Fixes https://github.com/fish-shell/fish-shell/issues/913

											
										
										
											2013-07-17 16:35:30 +08:00
+								            ap = begin;
 								            bp = end;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            // pos is where to begin looking for the next one. But if we reached the end there's no
 								            // next one.
 								            if (begin >= end) break;
-												Make parse_util_locate_cmdsubst return the innermost command substitution instead of the outermost.
Fixes https://github.com/fish-shell/fish-shell/issues/913

											
										
										
											2013-07-17 16:35:30 +08:00
+								            pos = begin + 1;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        } else if (begin >= cursor) {
 								            // This command substitution starts at or after the cursor. Since it was the first
 								            // command substitution in the string, we're done.
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								            break;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        } else {
 								            // This command substitution ends before the cursor. Skip it.
-												Make parse_util_locate_cmdsubst return the innermost command substitution instead of the outermost.
Fixes https://github.com/fish-shell/fish-shell/issues/913

											
										
										
											2013-07-17 16:35:30 +08:00
+								            assert(end < cursor);
 								            pos = end + 1;
 								            assert(pos <= buff + bufflen);
 								        }
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								    }
-												Improvements to new parser. All functions and completions now parse.

											
										
										
											2013-07-23 09:26:15 +08:00
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								    if (a != nullptr) *a = ap;
 								    if (b != nullptr) *b = bp;
-												Add support for calculating completions for arbitrary commands through the 'complete' builtin

darcs-hash:20060130165150-ac50b-5e2ef3bb0298dd5e1a5d6fbdade314cc73ef36f3.gz

											
										
										
											2006-01-31 00:51:50 +08:00
+								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								/// Get the beginning and end of the job or process definition under the cursor.
-												Fix completion for builtins (with subcommands)

Presently the completion engine ignores builtins that are part of the
fish syntax. This can be a problem when completing a string that was
based on the output of `commandline -p`.  This changes completions to
treat these builtins like any other command.

This also disables generic (filename) completion inside comments and
after strings that do not tokenize.

Additionally, comments are stripped off the output of `commandline -p`.

Fixes #5415
Fixes #2705

											
										
										
											2019-10-29 20:32:26 +08:00
+								static void job_or_process_extent(bool process, const wchar_t *buff, size_t cursor_pos,
 								                                  const wchar_t **a, const wchar_t **b,
 								                                  std::vector<tok_t> *tokens) {
-												Eliminate the CHECK() macro

This thing was pretty useless.

											
										
										
											2019-05-28 08:24:19 +08:00
+								    assert(buff && "Null buffer");
-												Clean up job_or_process_extent

This had a bad merge which happened to work, plus some other nonsense.

											
										
										
											2019-10-19 06:24:28 +08:00
+								    const wchar_t *begin = nullptr, *end = nullptr;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    int finished = 0;
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												Clean up job_or_process_extent

This had a bad merge which happened to work, plus some other nonsense.

											
										
										
											2019-10-19 06:24:28 +08:00
+								    if (a) *a = nullptr;
 								    if (b) *b = nullptr;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								    parse_util_cmdsubst_extent(buff, cursor_pos, &begin, &end);
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    if (!end || !begin) {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								        return;
 								    }
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												Change C casts to C++ ones

Some were kept for compatibility.

Found with -Wold-style-cast

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2020-04-09 07:56:59 +08:00
+								    assert(cursor_pos >= static_cast<size_t>(begin - buff));
-												Continue migration to the new tokenizer interface

											
										
										
											2015-07-26 15:12:36 +08:00
+								    const size_t pos = cursor_pos - (begin - buff);
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    if (a) *a = begin;
 								    if (b) *b = end;
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												Clean up job_or_process_extent

This had a bad merge which happened to work, plus some other nonsense.

											
										
										
											2019-10-19 06:24:28 +08:00
+								    const wcstring buffcpy(begin, end);
 								    tokenizer_t tok(buffcpy.c_str(), TOK_ACCEPT_UNFINISHED);
 								    maybe_t<tok_t> token{};
 								    while ((token = tok.next()) && !finished) {
 								        size_t tok_begin = token->offset;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
-												Clean up job_or_process_extent

This had a bad merge which happened to work, plus some other nonsense.

											
										
										
											2019-10-19 06:24:28 +08:00
+								        switch (token->type) {
 								            case token_type_t::pipe: {
 								                if (!process) {
-												Fix indentation of switch statements

											
										
										
											2012-11-19 16:31:03 +08:00
+								                    break;
 								                }
-												Clean up job_or_process_extent

This had a bad merge which happened to work, plus some other nonsense.

											
										
										
											2019-10-19 06:24:28 +08:00
+								            }
 								            /* FALLTHROUGH */
 								            case token_type_t::end:
 								            case token_type_t::background:
 								            case token_type_t::andand:
-												Fix completion for builtins (with subcommands)

Presently the completion engine ignores builtins that are part of the
fish syntax. This can be a problem when completing a string that was
based on the output of `commandline -p`.  This changes completions to
treat these builtins like any other command.

This also disables generic (filename) completion inside comments and
after strings that do not tokenize.

Additionally, comments are stripped off the output of `commandline -p`.

Fixes #5415
Fixes #2705

											
										
										
											2019-10-29 20:32:26 +08:00
+								            case token_type_t::oror:
 								            case token_type_t::comment: {
-												Clean up job_or_process_extent

This had a bad merge which happened to work, plus some other nonsense.

											
										
										
											2019-10-19 06:24:28 +08:00
+								                if (tok_begin >= pos) {
 								                    finished = 1;
-												[clang-tidy] Convert C casts to C++ ones

Found with google-readability-casting

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 09:08:16 +08:00
+								                    if (b) *b = const_cast<wchar_t *>(begin) + tok_begin;
-												Clean up job_or_process_extent

This had a bad merge which happened to work, plus some other nonsense.

											
										
										
											2019-10-19 06:24:28 +08:00
+								                } else {
-												Fix completion for builtins (with subcommands)

Presently the completion engine ignores builtins that are part of the
fish syntax. This can be a problem when completing a string that was
based on the output of `commandline -p`.  This changes completions to
treat these builtins like any other command.

This also disables generic (filename) completion inside comments and
after strings that do not tokenize.

Additionally, comments are stripped off the output of `commandline -p`.

Fixes #5415
Fixes #2705

											
										
										
											2019-10-29 20:32:26 +08:00
+								                    // Statement at cursor might start after this token.
-												[clang-tidy] Convert C casts to C++ ones

Found with google-readability-casting

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 09:08:16 +08:00
+								                    if (a) *a = const_cast<wchar_t *>(begin) + tok_begin + token->length;
-												Fix completion for builtins (with subcommands)

Presently the completion engine ignores builtins that are part of the
fish syntax. This can be a problem when completing a string that was
based on the output of `commandline -p`.  This changes completions to
treat these builtins like any other command.

This also disables generic (filename) completion inside comments and
after strings that do not tokenize.

Additionally, comments are stripped off the output of `commandline -p`.

Fixes #5415
Fixes #2705

											
										
										
											2019-10-29 20:32:26 +08:00
+								                    if (tokens) tokens->clear();
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								                }
-												Fix completion for builtins (with subcommands)

Presently the completion engine ignores builtins that are part of the
fish syntax. This can be a problem when completing a string that was
based on the output of `commandline -p`.  This changes completions to
treat these builtins like any other command.

This also disables generic (filename) completion inside comments and
after strings that do not tokenize.

Additionally, comments are stripped off the output of `commandline -p`.

Fixes #5415
Fixes #2705

											
										
										
											2019-10-29 20:32:26 +08:00
+								                continue;  // Do not add this to tokens
-												Clean up job_or_process_extent

This had a bad merge which happened to work, plus some other nonsense.

											
										
										
											2019-10-19 06:24:28 +08:00
+								            }
 								            default: {
 								                break;
-												Reformat all files

This runs build_tools/style.fish, which runs clang-format on C++, fish_indent on fish and (new) black on python.

If anything is wrong with the formatting, we should fix the tools, but automated formatting is worth it.

											
										
										
											2019-05-05 18:09:25 +08:00
+								            }
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
+								        }
-												Fix completion for builtins (with subcommands)

Presently the completion engine ignores builtins that are part of the
fish syntax. This can be a problem when completing a string that was
based on the output of `commandline -p`.  This changes completions to
treat these builtins like any other command.

This also disables generic (filename) completion inside comments and
after strings that do not tokenize.

Additionally, comments are stripped off the output of `commandline -p`.

Fixes #5415
Fixes #2705

											
										
										
											2019-10-29 20:32:26 +08:00
+								        if (tokens) tokens->push_back(*token);
-												Clean up job_or_process_extent

This had a bad merge which happened to work, plus some other nonsense.

											
										
										
											2019-10-19 06:24:28 +08:00
+								    }
-												Add support for calculating completions for arbitrary commands through the 'complete' builtin

darcs-hash:20060130165150-ac50b-5e2ef3bb0298dd5e1a5d6fbdade314cc73ef36f3.gz

											
										
										
											2006-01-31 00:51:50 +08:00
+								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								void parse_util_process_extent(const wchar_t *buff, size_t pos, const wchar_t **a,
-												Fix completion for builtins (with subcommands)

Presently the completion engine ignores builtins that are part of the
fish syntax. This can be a problem when completing a string that was
based on the output of `commandline -p`.  This changes completions to
treat these builtins like any other command.

This also disables generic (filename) completion inside comments and
after strings that do not tokenize.

Additionally, comments are stripped off the output of `commandline -p`.

Fixes #5415
Fixes #2705

											
										
										
											2019-10-29 20:32:26 +08:00
+								                               const wchar_t **b, std::vector<tok_t> *tokens) {
 								    job_or_process_extent(true, buff, pos, a, b, tokens);
-												Add support for calculating completions for arbitrary commands through the 'complete' builtin

darcs-hash:20060130165150-ac50b-5e2ef3bb0298dd5e1a5d6fbdade314cc73ef36f3.gz

											
										
										
											2006-01-31 00:51:50 +08:00
+								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								void parse_util_job_extent(const wchar_t *buff, size_t pos, const wchar_t **a, const wchar_t **b) {
-												Fix completion for builtins (with subcommands)

Presently the completion engine ignores builtins that are part of the
fish syntax. This can be a problem when completing a string that was
based on the output of `commandline -p`.  This changes completions to
treat these builtins like any other command.

This also disables generic (filename) completion inside comments and
after strings that do not tokenize.

Additionally, comments are stripped off the output of `commandline -p`.

Fixes #5415
Fixes #2705

											
										
										
											2019-10-29 20:32:26 +08:00
+								    job_or_process_extent(false, buff, pos, a, b, nullptr);
-												Add support for calculating completions for arbitrary commands through the 'complete' builtin

darcs-hash:20060130165150-ac50b-5e2ef3bb0298dd5e1a5d6fbdade314cc73ef36f3.gz

											
										
										
											2006-01-31 00:51:50 +08:00
+								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								void parse_util_token_extent(const wchar_t *buff, size_t cursor_pos, const wchar_t **tok_begin,
 								                             const wchar_t **tok_end, const wchar_t **prev_begin,
 								                             const wchar_t **prev_end) {
-												Eliminate the CHECK() macro

This thing was pretty useless.

											
										
										
											2019-05-28 08:24:19 +08:00
+								    assert(buff && "Null buffer");
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								    const wchar_t *a = nullptr, *b = nullptr, *pa = nullptr, *pb = nullptr;
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												Fix for parse_util_token_extent doing the wrong thing inside a command
substitution. Fixes https://github.com/fish-shell/fish-shell/issues/833

											
										
										
											2013-09-22 07:38:57 +08:00
+								    const wchar_t *cmdsubst_begin, *cmdsubst_end;
 								    parse_util_cmdsubst_extent(buff, cursor_pos, &cmdsubst_begin, &cmdsubst_end);
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    if (!cmdsubst_end || !cmdsubst_begin) {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								        return;
 								    }
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    // pos is equivalent to cursor_pos within the range of the command substitution {begin, end}.
-												eliminate signed/unsigned comparison warnings

This partially addresses #3430.

											
										
										
											2016-10-10 05:36:08 +08:00
+								    size_t offset_within_cmdsubst = cursor_pos - (cmdsubst_begin - buff);
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												This commit changes wchar.h includes to cwchar, and uses std::
for everything it provides.

											
										
										
											2019-03-13 05:06:01 +08:00
+								    size_t bufflen = std::wcslen(buff);
-												parse_util: Remove some wcharisms

											
										
										
											2018-10-21 04:25:55 +08:00
-												Fix for parse_util_token_extent doing the wrong thing inside a command
substitution. Fixes https://github.com/fish-shell/fish-shell/issues/833

											
										
										
											2013-09-22 07:38:57 +08:00
+								    a = cmdsubst_begin + offset_within_cmdsubst;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								    b = a;
-												Fix for parse_util_token_extent doing the wrong thing inside a command
substitution. Fixes https://github.com/fish-shell/fish-shell/issues/833

											
										
										
											2013-09-22 07:38:57 +08:00
+								    pa = cmdsubst_begin + offset_within_cmdsubst;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								    pb = pa;
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												Fix for parse_util_token_extent doing the wrong thing inside a command
substitution. Fixes https://github.com/fish-shell/fish-shell/issues/833

											
										
										
											2013-09-22 07:38:57 +08:00
+								    assert(cmdsubst_begin >= buff);
-												parse_util: Remove some wcharisms

											
										
										
											2018-10-21 04:25:55 +08:00
+								    assert(cmdsubst_begin <= (buff + bufflen));
-												Fix for parse_util_token_extent doing the wrong thing inside a command
substitution. Fixes https://github.com/fish-shell/fish-shell/issues/833

											
										
										
											2013-09-22 07:38:57 +08:00
+								    assert(cmdsubst_end >= cmdsubst_begin);
-												parse_util: Remove some wcharisms

											
										
										
											2018-10-21 04:25:55 +08:00
+								    assert(cmdsubst_end <= (buff + bufflen));
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    const wcstring buffcpy = wcstring(cmdsubst_begin, cmdsubst_end - cmdsubst_begin);
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												Rationalize how the parser reports tokenizer errors

Remove the unnecessary SQUASH_ERROR flag and correctly report errors
generated from the tokenizer.

											
										
										
											2018-02-24 09:28:12 +08:00
+								    tokenizer_t tok(buffcpy.c_str(), TOK_ACCEPT_UNFINISHED);
-												Clean up some tokenization

Remove TOK_NONE
Turn token_type into an enum class
Make next() return a maybe_t<tok_t> instead of a bool

											
										
										
											2019-10-14 07:06:16 +08:00
+								    while (maybe_t<tok_t> token = tok.next()) {
 								        size_t tok_begin = token->offset;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								        size_t tok_end = tok_begin;
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        // Calculate end of token.
-												Clean up some tokenization

Remove TOK_NONE
Turn token_type into an enum class
Make next() return a maybe_t<tok_t> instead of a bool

											
										
										
											2019-10-14 07:06:16 +08:00
+								        if (token->type == token_type_t::string) {
 								            tok_end += token->length;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								        }
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        // Cursor was before beginning of this token, means that the cursor is between two tokens,
 								        // so we set it to a zero element string and break.
 								        if (tok_begin > offset_within_cmdsubst) {
-												Fix for parse_util_token_extent doing the wrong thing inside a command
substitution. Fixes https://github.com/fish-shell/fish-shell/issues/833

											
										
										
											2013-09-22 07:38:57 +08:00
+								            a = b = cmdsubst_begin + offset_within_cmdsubst;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								            break;
 								        }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        // If cursor is inside the token, this is the token we are looking for. If so, set a and b
 								        // and break.
-												Clean up some tokenization

Remove TOK_NONE
Turn token_type into an enum class
Make next() return a maybe_t<tok_t> instead of a bool

											
										
										
											2019-10-14 07:06:16 +08:00
+								        if (token->type == token_type_t::string && tok_end >= offset_within_cmdsubst) {
 								            a = cmdsubst_begin + token->offset;
 								            b = a + token->length;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								            break;
 								        }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        // Remember previous string token.
-												Clean up some tokenization

Remove TOK_NONE
Turn token_type into an enum class
Make next() return a maybe_t<tok_t> instead of a bool

											
										
										
											2019-10-14 07:06:16 +08:00
+								        if (token->type == token_type_t::string) {
 								            pa = cmdsubst_begin + token->offset;
 								            pb = pa + token->length;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								        }
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
+								    }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    if (tok_begin) *tok_begin = a;
 								    if (tok_end) *tok_end = b;
 								    if (prev_begin) *prev_begin = pa;
 								    if (prev_end) *prev_end = pb;
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								    assert(pa >= buff);
-												parse_util: Remove some wcharisms

											
										
										
											2018-10-21 04:25:55 +08:00
+								    assert(pa <= (buff + bufflen));
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								    assert(pb >= pa);
-												parse_util: Remove some wcharisms

											
										
										
											2018-10-21 04:25:55 +08:00
+								    assert(pb <= (buff + bufflen));
-												Add support for calculating completions for arbitrary commands through the 'complete' builtin

darcs-hash:20060130165150-ac50b-5e2ef3bb0298dd5e1a5d6fbdade314cc73ef36f3.gz

											
										
										
											2006-01-31 00:51:50 +08:00
+								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								wcstring parse_util_unescape_wildcards(const wcstring &str) {
-												Rewrite parse_util_unescape_wildcards

Make it simpler, and use wcstring instead of wcsdup

											
										
										
											2015-08-20 02:35:24 +08:00
+								    wcstring result;
 								    result.reserve(str.size());
-												Add a feature_test() function

This is a convenience over fish_features().test()

											
										
										
											2018-05-06 10:44:57 +08:00
+								    bool unesc_qmark = !feature_test(features_t::qmark_noglob);
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
 								    const wchar_t *const cs = str.c_str();
 								    for (size_t i = 0; cs[i] != L'\0'; i++) {
 								        if (cs[i] == L'*') {
-												Rewrite parse_util_unescape_wildcards

Make it simpler, and use wcstring instead of wcsdup

											
										
										
											2015-08-20 02:35:24 +08:00
+								            result.push_back(ANY_STRING);
-												Feature flag support for ? wildcard

This partially reverts 6e56637cf0a6036fdea4105e9f33314a3d6e8e78 and #4520
by bringing back the ? wildcard, guarded by the qmark-noglob feature flag.

											
										
										
											2018-05-06 10:11:57 +08:00
+								        } else if (cs[i] == L'?' && unesc_qmark) {
 								            result.push_back(ANY_CHAR);
-												Remove support for the ? wildcard

Fixes #4520

											
										
										
											2018-04-01 07:48:57 +08:00
+								        } else if (cs[i] == L'\\' && cs[i + 1] == L'*') {
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            result.push_back(cs[i + 1]);
-												Rewrite parse_util_unescape_wildcards

Make it simpler, and use wcstring instead of wcsdup

											
										
										
											2015-08-20 02:35:24 +08:00
+								            i += 1;
-												Feature flag support for ? wildcard

This partially reverts 6e56637cf0a6036fdea4105e9f33314a3d6e8e78 and #4520
by bringing back the ? wildcard, guarded by the qmark-noglob feature flag.

											
										
										
											2018-05-06 10:11:57 +08:00
+								        } else if (cs[i] == L'\\' && cs[i + 1] == L'?' && unesc_qmark) {
 								            result.push_back(cs[i + 1]);
 								            i += 1;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        } else if (cs[i] == L'\\' && cs[i + 1] == L'\\') {
 								            // Not a wildcard, but ensure the next iteration doesn't see this escaped backslash.
-												Rewrite parse_util_unescape_wildcards

Make it simpler, and use wcstring instead of wcsdup

											
										
										
											2015-08-20 02:35:24 +08:00
+								            result.append(L"\\\\");
 								            i += 1;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        } else {
-												Rewrite parse_util_unescape_wildcards

Make it simpler, and use wcstring instead of wcsdup

											
										
										
											2015-08-20 02:35:24 +08:00
+								            result.push_back(cs[i]);
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								        }
 								    }
-												Rewrite parse_util_unescape_wildcards

Make it simpler, and use wcstring instead of wcsdup

											
										
										
											2015-08-20 02:35:24 +08:00
+								    return result;
-												Make sure that command specific completions can handle input strings with wildcards reasonably well

darcs-hash:20060219011432-ac50b-89a73a3d414f2dbd8a213b851fcb1c494e022eae.gz

											
										
										
											2006-02-19 09:14:32 +08:00
+								}
-												Add support for sending arguments when using the source builtin

darcs-hash:20060214195636-ac50b-511c211368103df6923d63cef99ce20a88d31be3.gz

											
										
										
											2006-02-15 03:56:36 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								/// Find the outermost quoting style of current token. Returns 0 if token is not quoted.
 								static wchar_t get_quote(const wcstring &cmd_str, size_t len) {
 								    size_t i = 0;
 								    wchar_t res = 0;
 								    const wchar_t *const cmd = cmd_str.c_str();
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												[clang-tidy] Use bool literals

Found with modernize-use-bool-literals

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-26 08:36:13 +08:00
+								    while (true) {
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        if (!cmd[i]) break;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        if (cmd[i] == L'\\') {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								            i++;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            if (!cmd[i]) break;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								            i++;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        } else {
 								            if (cmd[i] == L'\'' || cmd[i] == L'\"') {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								                const wchar_t *end = quote_end(&cmd[i]);
-												This commit changes wchar.h includes to cwchar, and uses std::
for everything it provides.

											
										
										
											2019-03-13 05:06:01 +08:00
+								                // std::fwprintf( stderr, L"Jump %d\n",  end-cmd );
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								                if ((end == nullptr) || (!*end) || (end > cmd + len)) {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								                    res = cmd[i];
 								                    break;
 								                }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								                i = end - cmd + 1;
 								            } else
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								                i++;
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
+								        }
 								    }
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								    return res;
-												Untangle unescaping responsibilities in highlight.cpp. Fix cd autosuggestions to properly handle quotes. Factor out some of the quote unescaping behavior from reader.cpp to parse_util.cpp.
Add some autosuggestion tests

											
										
										
											2012-07-07 05:34:53 +08:00
+								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								void parse_util_get_parameter_info(const wcstring &cmd, const size_t pos, wchar_t *quote,
-												Clean up some tokenization

Remove TOK_NONE
Turn token_type into an enum class
Make next() turn a maybe_t<tok_t> instead of a bool

											
										
										
											2019-10-14 07:06:16 +08:00
+								                                   size_t *offset, token_type_t *out_type) {
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    size_t prev_pos = 0;
-												fix bug introduced by 42458ff7

There was one block of code modified by commit 42458ff7 that had
convoluted, inverted, logic. In the process of collapsing nested
"if" blocks the logic was modified to avoid using "!" everywhere the
bool was tested. Unfortunately I neglected to modify two of the
conditions used to set that var to reflect the changed polarity.

											
										
										
											2016-10-25 08:13:39 +08:00
+								    wchar_t last_quote = L'\0';
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												Rationalize how the parser reports tokenizer errors

Remove the unnecessary SQUASH_ERROR flag and correctly report errors
generated from the tokenizer.

											
										
										
											2018-02-24 09:28:12 +08:00
+								    tokenizer_t tok(cmd.c_str(), TOK_ACCEPT_UNFINISHED);
-												Clean up some tokenization

Remove TOK_NONE
Turn token_type into an enum class
Make next() turn a maybe_t<tok_t> instead of a bool

											
										
										
											2019-10-14 07:06:16 +08:00
+								    while (auto token = tok.next()) {
 								        if (token->offset > pos) break;
-												Untangle unescaping responsibilities in highlight.cpp. Fix cd autosuggestions to properly handle quotes. Factor out some of the quote unescaping behavior from reader.cpp to parse_util.cpp.
Add some autosuggestion tests

											
										
										
											2012-07-07 05:34:53 +08:00
-												Clean up some tokenization

Remove TOK_NONE
Turn token_type into an enum class
Make next() turn a maybe_t<tok_t> instead of a bool

											
										
										
											2019-10-14 07:06:16 +08:00
+								        if (token->type == token_type_t::string)
 								            last_quote = get_quote(tok.text_of(*token), pos - token->offset);
-												Untangle unescaping responsibilities in highlight.cpp. Fix cd autosuggestions to properly handle quotes. Factor out some of the quote unescaping behavior from reader.cpp to parse_util.cpp.
Add some autosuggestion tests

											
										
										
											2012-07-07 05:34:53 +08:00
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								        if (out_type != nullptr) *out_type = token->type;
-												Untangle unescaping responsibilities in highlight.cpp. Fix cd autosuggestions to properly handle quotes. Factor out some of the quote unescaping behavior from reader.cpp to parse_util.cpp.
Add some autosuggestion tests

											
										
										
											2012-07-07 05:34:53 +08:00
-												Clean up some tokenization

Remove TOK_NONE
Turn token_type into an enum class
Make next() turn a maybe_t<tok_t> instead of a bool

											
										
										
											2019-10-14 07:06:16 +08:00
+								        prev_pos = token->offset;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								    }
-												Untangle unescaping responsibilities in highlight.cpp. Fix cd autosuggestions to properly handle quotes. Factor out some of the quote unescaping behavior from reader.cpp to parse_util.cpp.
Add some autosuggestion tests

											
										
										
											2012-07-07 05:34:53 +08:00
 								    wchar_t *cmd_tmp = wcsdup(cmd.c_str());
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    cmd_tmp[pos] = 0;
-												parse_util: Remove some wcharisms

											
										
										
											2018-10-21 04:25:55 +08:00
+								    size_t cmdlen = pos;
-												fix bug introduced by 42458ff7

There was one block of code modified by commit 42458ff7 that had
convoluted, inverted, logic. In the process of collapsing nested
"if" blocks the logic was modified to avoid using "!" everywhere the
bool was tested. Unfortunately I neglected to modify two of the
conditions used to set that var to reflect the changed polarity.

											
										
										
											2016-10-25 08:13:39 +08:00
+								    bool finished = cmdlen != 0;
-												lint: "collapsible if statements" warnings

											
										
										
											2016-10-23 02:21:13 +08:00
+								    if (finished) {
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								        finished = (quote == nullptr);
-												This commit changes wchar.h includes to cwchar, and uses std::
for everything it provides.

											
										
										
											2019-03-13 05:06:01 +08:00
+								        if (finished && std::wcschr(L" \t\n\r", cmd_tmp[cmdlen - 1])) {
-												fix bug introduced by 42458ff7

There was one block of code modified by commit 42458ff7 that had
convoluted, inverted, logic. In the process of collapsing nested
"if" blocks the logic was modified to avoid using "!" everywhere the
bool was tested. Unfortunately I neglected to modify two of the
conditions used to set that var to reflect the changed polarity.

											
										
										
											2016-10-25 08:13:39 +08:00
+								            finished = cmdlen > 1 && cmd_tmp[cmdlen - 2] == L'\\';
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
+								        }
 								    }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    if (quote) *quote = last_quote;
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								    if (offset != nullptr) {
-												lint: "collapsible if statements" warnings

											
										
										
											2016-10-23 02:21:13 +08:00
+								        if (finished) {
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								            while ((cmd_tmp[prev_pos] != 0) && (std::wcschr(L";|", cmd_tmp[prev_pos]) != nullptr))
-												Reformat all files

This runs build_tools/style.fish, which runs clang-format on C++, fish_indent on fish and (new) black on python.

If anything is wrong with the formatting, we should fix the tools, but automated formatting is worth it.

											
										
										
											2019-05-05 18:09:25 +08:00
+								                prev_pos++;
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								            *offset = prev_pos;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        } else {
-												Apply new indentation, brace, and whitespace style

											
										
										
											2012-11-19 08:30:30 +08:00
+								            *offset = pos;
 								        }
-												Remove trailing whitespaces and change tabs to spaces

											
										
										
											2012-11-18 18:23:22 +08:00
+								    }
-												lint: "collapsible if statements" warnings

											
										
										
											2016-10-23 02:21:13 +08:00
-												Untangle unescaping responsibilities in highlight.cpp. Fix cd autosuggestions to properly handle quotes. Factor out some of the quote unescaping behavior from reader.cpp to parse_util.cpp.
Add some autosuggestion tests

											
										
										
											2012-07-07 05:34:53 +08:00
+								    free(cmd_tmp);
 								}
-												Teach parse_util_escape_string_with_quote about tildes

Properly escape literal tildes in tab completion results. Currently we
always escape tildes in unquoted arguments; in the future we may escape
only leading tildes.

Fixes #2274

											
										
										
											2018-02-18 06:36:43 +08:00
+								wcstring parse_util_escape_string_with_quote(const wcstring &cmd, wchar_t quote, bool no_tilde) {
-												Untangle unescaping responsibilities in highlight.cpp. Fix cd autosuggestions to properly handle quotes. Factor out some of the quote unescaping behavior from reader.cpp to parse_util.cpp.
Add some autosuggestion tests

											
										
										
											2012-07-07 05:34:53 +08:00
+								    wcstring result;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    if (quote == L'\0') {
-												Revert "Escape separators (colon and equals) to improve completion"

This reverts commit f7dac82ed601135754d0c65536f79d07d83e9fae from pull
request #6059.

As discussed in #6099, this caused a regression in some completions (eg
dd).

											
										
										
											2019-09-19 14:32:40 +08:00
+								        escape_flags_t flags = ESCAPE_ALL | ESCAPE_NO_QUOTED | (no_tilde ? ESCAPE_NO_TILDE : 0);
-												Teach parse_util_escape_string_with_quote about tildes

Properly escape literal tildes in tab completion results. Currently we
always escape tildes in unquoted arguments; in the future we may escape
only leading tildes.

Fixes #2274

											
										
										
											2018-02-18 06:36:43 +08:00
+								        result = escape_string(cmd, flags);
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    } else {
-												Correct handling of unescapable entities in quotes

Prior to this fix, if you attempt to complete from inside a quote and the
completion contained an entity that cannot be represented inside quotes
(i.e. \n \r \t \b), the result would be a broken mess of quotes. Rewrite
the implementation so that it exits the quotes, emits the correct unquoted
escape, and then re-enters the quotes.

											
										
										
											2018-02-18 07:04:31 +08:00
+								        // Here we are going to escape a string with quotes.
 								        // A few characters cannot be represented inside quotes, e.g. newlines. In that case,
 								        // terminate the quote and then re-enter it.
 								        result.reserve(cmd.size());
 								        for (wchar_t c : cmd) {
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            switch (c) {
-												Fix indentation of switch statements

											
										
										
											2012-11-19 16:31:03 +08:00
+								                case L'\n':
-												Correct handling of unescapable entities in quotes

Prior to this fix, if you attempt to complete from inside a quote and the
completion contained an entity that cannot be represented inside quotes
(i.e. \n \r \t \b), the result would be a broken mess of quotes. Rewrite
the implementation so that it exits the quotes, emits the correct unquoted
escape, and then re-enters the quotes.

											
										
										
											2018-02-18 07:04:31 +08:00
+								                    result.append({quote, L'\\', L'n', quote});
 								                    break;
-												Fix indentation of switch statements

											
										
										
											2012-11-19 16:31:03 +08:00
+								                case L'\t':
-												Correct handling of unescapable entities in quotes

Prior to this fix, if you attempt to complete from inside a quote and the
completion contained an entity that cannot be represented inside quotes
(i.e. \n \r \t \b), the result would be a broken mess of quotes. Rewrite
the implementation so that it exits the quotes, emits the correct unquoted
escape, and then re-enters the quotes.

											
										
										
											2018-02-18 07:04:31 +08:00
+								                    result.append({quote, L'\\', L't', quote});
 								                    break;
-												Fix indentation of switch statements

											
										
										
											2012-11-19 16:31:03 +08:00
+								                case L'\b':
-												Correct handling of unescapable entities in quotes

Prior to this fix, if you attempt to complete from inside a quote and the
completion contained an entity that cannot be represented inside quotes
(i.e. \n \r \t \b), the result would be a broken mess of quotes. Rewrite
the implementation so that it exits the quotes, emits the correct unquoted
escape, and then re-enters the quotes.

											
										
										
											2018-02-18 07:04:31 +08:00
+								                    result.append({quote, L'\\', L'b', quote});
-												Fix indentation of switch statements

											
										
										
											2012-11-19 16:31:03 +08:00
+								                    break;
-												Correct handling of unescapable entities in quotes

Prior to this fix, if you attempt to complete from inside a quote and the
completion contained an entity that cannot be represented inside quotes
(i.e. \n \r \t \b), the result would be a broken mess of quotes. Rewrite
the implementation so that it exits the quotes, emits the correct unquoted
escape, and then re-enters the quotes.

											
										
										
											2018-02-18 07:04:31 +08:00
+								                case L'\r':
 								                    result.append({quote, L'\\', L'r', quote});
 								                    break;
 								                case L'\\':
 								                    result.append({L'\\', L'\\'});
 								                    break;
-												Escape literal dollar signs in quoted completions

Closes #6060.

											
										
										
											2019-08-24 16:31:36 +08:00
+								                case L'$':
 								                    if (quote == L'"') result.push_back(L'\\');
 								                    result.push_back(L'$');
 								                    break;
-												Correct handling of unescapable entities in quotes

Prior to this fix, if you attempt to complete from inside a quote and the
completion contained an entity that cannot be represented inside quotes
(i.e. \n \r \t \b), the result would be a broken mess of quotes. Rewrite
the implementation so that it exits the quotes, emits the correct unquoted
escape, and then re-enters the quotes.

											
										
										
											2018-02-18 07:04:31 +08:00
+								                default:
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								                    if (c == quote) result.push_back(L'\\');
-												Fix indentation of switch statements

											
										
										
											2012-11-19 16:31:03 +08:00
+								                    result.push_back(c);
 								                    break;
-												Untangle unescaping responsibilities in highlight.cpp. Fix cd autosuggestions to properly handle quotes. Factor out some of the quote unescaping behavior from reader.cpp to parse_util.cpp.
Add some autosuggestion tests

											
										
										
											2012-07-07 05:34:53 +08:00
+								            }
 								        }
 								    }
 								    return result;
 								}
-												Rewriting indenting functionality to use new parser

											
										
										
											2013-12-09 05:41:12 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								std::vector<int> parse_util_compute_indents(const wcstring &src) {
 								    // Make a vector the same size as the input string, which contains the indents. Initialize them
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
+								    // to 0.
-												Rewriting indenting functionality to use new parser

											
										
										
											2013-12-09 05:41:12 +08:00
+								    const size_t src_size = src.size();
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
+								    std::vector<int> indents(src_size, 0);
-												Update style and formatting to conform to fish style guide.

											
										
										
											2014-01-15 17:40:40 +08:00
-												Optimize parse_util_compute_indents

Exploit the fact that most input strings will not contain newlines,
in which case we do not have to parse anything.

											
										
										
											2020-03-03 17:24:05 +08:00
+								    // Simple trick: if our source does not contain a newline, then all indents are 0.
 								    if (src.find('\n') == wcstring::npos) {
 								        return indents;
 								    }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    // Parse the string. We pass continue_after_error to produce a forest; the trailing indent of
 								    // the last node we visited becomes the input indent of the next. I.e. in the case of 'switch
 								    // foo ; cas', we get an invalid parse tree (since 'cas' is not valid) but we indent it as if it
 								    // were a case item list.
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
+								    using namespace ast;
 								    auto ast =
 								        ast_t::parse(src, parse_flag_continue_after_error | parse_flag_include_comments |
 								                              parse_flag_accept_incomplete_tokens | parse_flag_leave_unterminated);
 								    // Visit all of our nodes. When we get a job_list or case_item_list, increment indent while
 								    // visiting its children.
 								    struct indent_visitor_t {
-												Indent continuations after | and &&

This indents continuations after pipes and conjunctions if they contain
a newline.

Example:

    cmd1 &&
        cmd2

But it avoids the "double indent" if it indented unconditionally:

    cmd1 | begin
        cmd2
    end

More work towards improving #7252

											
										
										
											2020-08-10 03:15:14 +08:00
+								        indent_visitor_t(const wcstring &src, std::vector<int> &indents)
 								            : src(src), indents(indents) {}
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
 								        void visit(const node_t &node) {
 								            int inc = 0;
 								            int dec = 0;
 								            switch (node.type) {
 								                case type_t::job_list:
 								                case type_t::andor_job_list:
 								                    // Job lists are never unwound.
 								                    inc = 1;
 								                    dec = 1;
 								                    break;
 								                // Increment indents for conditions in headers (#1665).
 								                case type_t::job_conjunction:
 								                    if (node.parent->type == type_t::while_header ||
 								                        node.parent->type == type_t::if_clause) {
 								                        inc = 1;
 								                        dec = 1;
 								                    }
 								                    break;
-												Update style and formatting to conform to fish style guide.

											
										
										
											2014-01-15 17:40:40 +08:00
-												Indent continuations after | and &&

This indents continuations after pipes and conjunctions if they contain
a newline.

Example:

    cmd1 &&
        cmd2

But it avoids the "double indent" if it indented unconditionally:

    cmd1 | begin
        cmd2
    end

More work towards improving #7252

											
										
										
											2020-08-10 03:15:14 +08:00
+								                // Increment indents for job_continuation_t if it contains a newline.
 								                // This is a bit of a hack - it indents cases like:
 								                //    cmd1 |
 								                //    ....cmd2
 								                // but avoids "double indenting" if there's no newline:
 								                //   cmd1 | while cmd2
 								                //   ....cmd3
 								                //   end
 								                // See #7252.
 								                case type_t::job_continuation:
 								                    if (has_newline(node.as<job_continuation_t>()->newlines)) {
 								                        inc = 1;
 								                        dec = 1;
 								                    }
 								                    break;
 								                // Likewise for && and ||.
 								                case type_t::job_conjunction_continuation:
 								                    if (has_newline(node.as<job_conjunction_continuation_t>()->newlines)) {
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
+								                        inc = 1;
 								                        dec = 1;
 								                    }
 								                    break;
 								                case type_t::case_item_list:
 								                    // Here's a hack. Consider:
 								                    // switch abc
 								                    //    cas
 								                    //
 								                    // fish will see that 'cas' is not valid inside a switch statement because it is
 								                    // not "case". It will then unwind back to the top level job list, producing a
 								                    // parse tree like:
 								                    //
 								                    //   job_list
 								                    //      switch_job
 								                    //         <err>
 								                    //      normal_job
 								                    //         cas
 								                    //
 								                    // And so we will think that the 'cas' job is at the same level as the switch.
 								                    // To address this, if we see that the switch statement was not closed, do not
 								                    // decrement the indent afterwards.
 								                    inc = 1;
 								                    dec = node.parent->as<switch_statement_t>()->end.unsourced ? 0 : 1;
 								                    break;
-												Indent only leaf nodes and in-between gaps

Probably not necessary for the next commit, but this way feels more logical

											
										
										
											2021-02-08 11:42:24 +08:00
+								                case type_t::token_base: {
 								                    auto tok = node.as<token_base_t>();
 								                    if (node.parent->type == type_t::begin_header &&
 								                        tok->type == parse_token_type_t::end) {
 								                        // The newline after "begin" is optional, so it is part of the header.
 								                        // The header is not in the indented block, so indent the newline here.
 								                        if (node.source(src) == L"\n") {
 								                            inc = 1;
 								                            dec = 1;
 								                        }
 								                    }
 								                    break;
 								                }
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
+								                default:
 								                    break;
-												Fix to indent comments in blocks properly (#1710)

This makes two changes to parse trees:

1. Unmaterialized nodes no longer have an invalid source location
For example, with the code `while false;end` there are no tokens
associated with the while loop's job_list, and therefore it is
unmaterialized. Previously it would have had a SOURCE_OFFSET_INVALID.
But now it has a zero source length, but an offset equal to the end of
the while loop (i.e. the semicolon), and a zero length. Correspondingly,
the has_source function now checks the length instead of the offset.

2. Special (comment and error) nodes have always been "disconnected,"
meaning they are not the child of any other node. However, they now have
their parent offsets set to whatever the top of the node stack was when
the node was encountered. This gives us a sense of which node the
comment is "in", e.g. if we are constructing a job list then the
comment's parent will be the job list. This lets us determine the
comment's indent.

											
										
										
											2014-09-30 02:29:50 +08:00
+								            }
-												Indent only leaf nodes and in-between gaps

Probably not necessary for the next commit, but this way feels more logical

											
										
										
											2021-02-08 11:42:24 +08:00
 								            auto range = node.source_range();
 								            if (range.length > 0 && node.category == category_t::leaf) {
-												Indent escaped newlines

Similar to what fish_indent does. After typing "echo \" and hitting return,
the cursor will be indented.

A possible annoyance is that when you have multiple indented lines

	echo 1 \
	    2 \
	    3 \
	    4 \

If you remove lines in the middle with Control-k, the lines below
the deleted one will start jumping around, as they are disconnected
from and reconnected to "echo".

											
										
										
											2021-02-08 12:01:17 +08:00
+								                record_line_continuations_until(range.start);
-												Indent only leaf nodes and in-between gaps

Probably not necessary for the next commit, but this way feels more logical

											
										
										
											2021-02-08 11:42:24 +08:00
+								                std::fill(indents.begin() + last_leaf_end, indents.begin() + range.start,
 								                          last_indent);
 								            }
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
+								            indent += inc;
-												Fix to indent comments in blocks properly (#1710)

This makes two changes to parse trees:

1. Unmaterialized nodes no longer have an invalid source location
For example, with the code `while false;end` there are no tokens
associated with the while loop's job_list, and therefore it is
unmaterialized. Previously it would have had a SOURCE_OFFSET_INVALID.
But now it has a zero source length, but an offset equal to the end of
the while loop (i.e. the semicolon), and a zero length. Correspondingly,
the has_source function now checks the length instead of the offset.

2. Special (comment and error) nodes have always been "disconnected,"
meaning they are not the child of any other node. However, they now have
their parent offsets set to whatever the top of the node stack was when
the node was encountered. This gives us a sense of which node the
comment is "in", e.g. if we are constructing a job list then the
comment's parent will be the job list. This lets us determine the
comment's indent.

											
										
										
											2014-09-30 02:29:50 +08:00
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
+								            // If we increased the indentation, apply it to the remainder of the string, even if the
 								            // list is empty. For example (where _ represents the cursor):
 								            //
 								            //    if foo
 								            //       _
 								            //
 								            // we want to indent the newline.
 								            if (inc) {
 								                last_indent = indent;
 								            }
 								            // If this is a leaf node, apply the current indentation.
-												Refactor: collapse if statements
											
										
										
											2021-02-13 14:48:19 +08:00
+								            if (node.category == category_t::leaf && range.length > 0) {
 								                std::fill(indents.begin() + range.start, indents.begin() + range.end(), indent);
 								                last_leaf_end = range.start + range.length;
 								                last_indent = indent;
-												Rewriting indenting functionality to use new parser

											
										
										
											2013-12-09 05:41:12 +08:00
+								            }
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
 								            node_visitor(*this).accept_children_of(&node);
 								            indent -= dec;
-												Rewriting indenting functionality to use new parser

											
										
										
											2013-12-09 05:41:12 +08:00
+								        }
-												Indent continuations after | and &&

This indents continuations after pipes and conjunctions if they contain
a newline.

Example:

    cmd1 &&
        cmd2

But it avoids the "double indent" if it indented unconditionally:

    cmd1 | begin
        cmd2
    end

More work towards improving #7252

											
										
										
											2020-08-10 03:15:14 +08:00
+								        /// \return whether a maybe_newlines node contains at least one newline.
 								        bool has_newline(const maybe_newlines_t &nls) const {
 								            return nls.source(src).find(L'\n') != wcstring::npos;
 								        }
-												Indent escaped newlines

Similar to what fish_indent does. After typing "echo \" and hitting return,
the cursor will be indented.

A possible annoyance is that when you have multiple indented lines

	echo 1 \
	    2 \
	    3 \
	    4 \

If you remove lines in the middle with Control-k, the lines below
the deleted one will start jumping around, as they are disconnected
from and reconnected to "echo".

											
										
										
											2021-02-08 12:01:17 +08:00
+								        void record_line_continuations_until(size_t offset) {
 								            wcstring gap_text = src.substr(last_leaf_end, offset - last_leaf_end);
 								            size_t escaped_nl = gap_text.find(L"\\\n");
 								            if (escaped_nl == wcstring::npos) return;
-												Do not indent after escaped newline in comment

We do something similar in fish_indent.  This fixes the spurious indent
after comments in share/completions/emerge.fish.

See #7720

											
										
										
											2021-02-17 01:16:05 +08:00
+								            auto line_end = gap_text.begin() + escaped_nl;
 								            if (std::find(gap_text.begin(), line_end, L'#') != line_end) return;
-												Indent escaped newlines

Similar to what fish_indent does. After typing "echo \" and hitting return,
the cursor will be indented.

A possible annoyance is that when you have multiple indented lines

	echo 1 \
	    2 \
	    3 \
	    4 \

If you remove lines in the middle with Control-k, the lines below
the deleted one will start jumping around, as they are disconnected
from and reconnected to "echo".

											
										
										
											2021-02-08 12:01:17 +08:00
+								            auto end = src.begin() + offset;
 								            auto newline = src.begin() + last_leaf_end + escaped_nl + 1;
 								            // The gap text might contain multiple newlines if there are multiple lines that
 								            // don't contain an AST node, for example, comment lines, or lines containing only
 								            // the escaped newline.
 								            do {
 								                line_continuations.push_back(newline - src.begin());
 								                newline = std::find(newline + 1, end, L'\n');
 								            } while (newline != end);
 								        }
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
+								        // The one-past-the-last index of the most recently encountered leaf node.
 								        // We use this to populate the indents even if there's no tokens in the range.
 								        size_t last_leaf_end{0};
 								        // The last indent which we assigned.
 								        int last_indent{-1};
-												Indent continuations after | and &&

This indents continuations after pipes and conjunctions if they contain
a newline.

Example:

    cmd1 &&
        cmd2

But it avoids the "double indent" if it indented unconditionally:

    cmd1 | begin
        cmd2
    end

More work towards improving #7252

											
										
										
											2020-08-10 03:15:14 +08:00
+								        // The source we are indenting.
 								        const wcstring &src;
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
+								        // List of indents, which we populate.
 								        std::vector<int> &indents;
-												Update style and formatting to conform to fish style guide.

											
										
										
											2014-01-15 17:40:40 +08:00
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
+								        // Initialize our starting indent to -1, as our top-level node is a job list which
 								        // will immediately increment it.
 								        int indent{-1};
-												Indent escaped newlines

Similar to what fish_indent does. After typing "echo \" and hitting return,
the cursor will be indented.

A possible annoyance is that when you have multiple indented lines

	echo 1 \
	    2 \
	    3 \
	    4 \

If you remove lines in the middle with Control-k, the lines below
the deleted one will start jumping around, as they are disconnected
from and reconnected to "echo".

											
										
										
											2021-02-08 12:01:17 +08:00
 								        // List of locations of escaped newline characters.
 								        std::vector<size_t> line_continuations;
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
+								    };
-												Indent continuations after | and &&

This indents continuations after pipes and conjunctions if they contain
a newline.

Example:

    cmd1 &&
        cmd2

But it avoids the "double indent" if it indented unconditionally:

    cmd1 | begin
        cmd2
    end

More work towards improving #7252

											
										
										
											2020-08-10 03:15:14 +08:00
+								    indent_visitor_t iv(src, indents);
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
+								    node_visitor(iv).accept(ast.top());
-												Indent escaped newlines

Similar to what fish_indent does. After typing "echo \" and hitting return,
the cursor will be indented.

A possible annoyance is that when you have multiple indented lines

	echo 1 \
	    2 \
	    3 \
	    4 \

If you remove lines in the middle with Control-k, the lines below
the deleted one will start jumping around, as they are disconnected
from and reconnected to "echo".

											
										
										
											2021-02-08 12:01:17 +08:00
+								    iv.record_line_continuations_until(indents.size());
-												Indent only leaf nodes and in-between gaps

Probably not necessary for the next commit, but this way feels more logical

											
										
										
											2021-02-08 11:42:24 +08:00
+								    std::fill(indents.begin() + iv.last_leaf_end, indents.end(), iv.last_indent);
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
 								    // All newlines now get the *next* indent.
 								    // For example, in this code:
 								    //    if true
 								    //       stuff
 								    // the newline "belongs" to the if statement as it ends its job.
 								    // But when rendered, it visually belongs to the job list.
 								    size_t idx = src_size;
 								    int next_indent = iv.last_indent;
 								    while (idx--) {
 								        if (src.at(idx) == L'\n') {
-												Indent empty lines inside block
											
										
										
											2021-02-08 11:37:50 +08:00
+								            bool empty_middle_line = idx + 1 < src_size && src.at(idx + 1) == L'\n';
 								            if (!empty_middle_line) {
 								                indents.at(idx) = next_indent;
 								            }
-												Adopt the new AST in parse_util_compute_indents

This switches parse_util_compute_indents from parsing with parse_tree to
the new ast.

It also reworks the parse_util_compute_indents tests, because
parse_util_compute_indents will be the backing for fish_indent.

											
										
										
											2020-06-21 09:22:11 +08:00
+								        } else {
 								            next_indent = indents.at(idx);
 								        }
 								    }
-												Indent escaped newlines

Similar to what fish_indent does. After typing "echo \" and hitting return,
the cursor will be indented.

A possible annoyance is that when you have multiple indented lines

	echo 1 \
	    2 \
	    3 \
	    4 \

If you remove lines in the middle with Control-k, the lines below
the deleted one will start jumping around, as they are disconnected
from and reconnected to "echo".

											
										
										
											2021-02-08 12:01:17 +08:00
+								    // Add an extra level of indentation to continuation lines.
 								    for (size_t idx : iv.line_continuations) {
 								        do {
 								            indents.at(idx)++;
 								        } while (++idx < src_size && src.at(idx) != L'\n');
 								    }
-												Rewriting indenting functionality to use new parser

											
										
										
											2013-12-09 05:41:12 +08:00
+								    return indents;
 								}
-												Initial work on backtrace support with new parser

											
										
										
											2013-12-16 08:05:37 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								/// Append a syntax error to the given error list.
 								static bool append_syntax_error(parse_error_list_t *errors, size_t source_location,
 								                                const wchar_t *fmt, ...) {
-												Reduce copying in parse_util_detect_errors

Allow parse_util_detect_errors to accept an already-parsed ast. This
eliminates a copy of the source, which is helpful when executing large
scripts.

											
										
										
											2020-07-13 04:55:51 +08:00
+								    if (!errors) return true;
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								    parse_error_t error;
 								    error.source_start = source_location;
 								    error.source_length = 0;
 								    error.code = parse_error_syntax;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								    va_list va;
 								    va_start(va, fmt);
 								    error.text = vformat_string(fmt, va);
 								    va_end(va);
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
-												Reduce copying in parse_util_detect_errors

Allow parse_util_detect_errors to accept an already-parsed ast. This
eliminates a copy of the source, which is helpful when executing large
scripts.

											
										
										
											2020-07-13 04:55:51 +08:00
+								    errors->push_back(std::move(error));
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								    return true;
 								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								/// Returns 1 if the specified command is a builtin that may not be used in a pipeline.
-												Eliminate / vet and whitelist some more globals

											
										
										
											2018-09-29 12:58:44 +08:00
+								static const wchar_t *const forbidden_pipe_commands[] = {L"exec", L"case", L"break", L"return",
 								                                                         L"continue"};
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								static int parser_is_pipe_forbidden(const wcstring &word) {
-												cleanup env code and `contains()`

Switch from null terminated arrays to `wcstring_list_t` for lists of
special env var names. Rename `list_contains_string` to `contains` and
modify the latter interface to not rely on a `#define`.

Rename `list_contains_string()` to `contains()` and eliminate the
current variadic implementation. Update all callers of the removed
version to use the string list version.

											
										
										
											2017-04-05 12:28:57 +08:00
+								    return contains(forbidden_pipe_commands, word);
-												Initial work on backtrace support with new parser

											
										
										
											2013-12-16 08:05:37 +08:00
+								}
-												fix `echo -h`

In addition to fixing `echo -h` this includes some debugging related
cleanups I made while investigating the issue.

Fixes #4120

											
										
										
											2017-06-19 13:07:48 +08:00
/// \return true if the argument \p s is exactly "-h" or "--help".
/// A null pointer is never a help flag and yields false.
bool parse_util_argument_is_help(const wchar_t *s) {
    // std::wcscmp requires both arguments to point to valid wide strings, so reject null up front.
    if (s == nullptr) return false;
    return std::wcscmp(L"-h", s) == 0 || std::wcscmp(L"--help", s) == 0;
}
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								// \return a pointer to the first argument node of an argument_or_redirection_list_t, or nullptr if
 								// there are no arguments.
-												Declare functions in headers or use internal linkage (static)

Found with gcc's -Wmissing-declarations which gives warnings like

	../src/tinyexpr.cpp:61:5: warning: no previous declaration for ‘int get_arity(int)’ [-Wmissing-declarations]
	   61 | int get_arity(const int type) {

The same warnings show up for builtin functions like builtin_bg because they
currently don't include their own headers. I left that.
Also reformat the touched files.

											
										
										
											2020-09-09 04:04:44 +08:00
+								static const ast::argument_t *get_first_arg(const ast::argument_or_redirection_list_t &list) {
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								    for (const ast::argument_or_redirection_t &v : list) {
 								        if (v.is_argument()) return &v.argument();
-												Initial work on backtrace support with new parser

											
										
										
											2013-12-16 08:05:37 +08:00
+								    }
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								    return nullptr;
-												Initial work on backtrace support with new parser

											
										
										
											2013-12-16 08:05:37 +08:00
+								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								/// Given a wide character immediately after a dollar sign, return the appropriate error message.
 								/// For example, if wc is @, then the variable name was $@ and we suggest $argv.
 								static const wchar_t *error_format_for_character(wchar_t wc) {
 								    switch (wc) {
-												restyle switch blocks to match project style

I missed restyling a few "switch" blocks to make them consistent with the rest
of the code base. This fixes that oversight. This should be the final step in
restyling the C++ code to have a consistent style. This also includes a few
trivial cleanups elsewhere.

I also missed restyling the "complete" module when working my way from a to z
so this final change includes restyling that module.

Total lint errors decreased 36%. Cppcheck errors went from 47 to 24. Oclint P2
errors went from 819 to 778. Oclint P3 errors went from 3252 to 1842.

Resolves #2902.

											
										
										
											2016-05-04 07:23:30 +08:00
+								        case L'?': {
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            return ERROR_NOT_STATUS;
-												restyle switch blocks to match project style

I missed restyling a few "switch" blocks to make them consistent with the rest
of the code base. This fixes that oversight. This should be the final step in
restyling the C++ code to have a consistent style. This also includes a few
trivial cleanups elsewhere.

I also missed restyling the "complete" module when working my way from a to z
so this final change includes restyling that module.

Total lint errors decreased 36%. Cppcheck errors went from 47 to 24. Oclint P2
errors went from 819 to 778. Oclint P3 errors went from 3252 to 1842.

Resolves #2902.

											
										
										
											2016-05-04 07:23:30 +08:00
+								        }
 								        case L'#': {
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            return ERROR_NOT_ARGV_COUNT;
-												restyle switch blocks to match project style

I missed restyling a few "switch" blocks to make them consistent with the rest
of the code base. This fixes that oversight. This should be the final step in
restyling the C++ code to have a consistent style. This also includes a few
trivial cleanups elsewhere.

I also missed restyling the "complete" module when working my way from a to z
so this final change includes restyling that module.

Total lint errors decreased 36%. Cppcheck errors went from 47 to 24. Oclint P2
errors went from 819 to 778. Oclint P3 errors went from 3252 to 1842.

Resolves #2902.

											
										
										
											2016-05-04 07:23:30 +08:00
+								        }
 								        case L'@': {
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            return ERROR_NOT_ARGV_AT;
-												restyle switch blocks to match project style

I missed restyling a few "switch" blocks to make them consistent with the rest
of the code base. This fixes that oversight. This should be the final step in
restyling the C++ code to have a consistent style. This also includes a few
trivial cleanups elsewhere.

I also missed restyling the "complete" module when working my way from a to z
so this final change includes restyling that module.

Total lint errors decreased 36%. Cppcheck errors went from 47 to 24. Oclint P2
errors went from 819 to 778. Oclint P3 errors went from 3252 to 1842.

Resolves #2902.

											
										
										
											2016-05-04 07:23:30 +08:00
+								        }
 								        case L'*': {
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            return ERROR_NOT_ARGV_STAR;
-												restyle switch blocks to match project style

I missed restyling a few "switch" blocks to make them consistent with the rest
of the code base. This fixes that oversight. This should be the final step in
restyling the C++ code to have a consistent style. This also includes a few
trivial cleanups elsewhere.

I also missed restyling the "complete" module when working my way from a to z
so this final change includes restyling that module.

Total lint errors decreased 36%. Cppcheck errors went from 47 to 24. Oclint P2
errors went from 819 to 778. Oclint P3 errors went from 3252 to 1842.

Resolves #2902.

											
										
										
											2016-05-04 07:23:30 +08:00
+								        }
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								        case L'$':
 								        case VARIABLE_EXPAND:
 								        case VARIABLE_EXPAND_SINGLE:
-												restyle switch blocks to match project style

I missed restyling a few "switch" blocks to make them consistent with the rest
of the code base. This fixes that oversight. This should be the final step in
restyling the C++ code to have a consistent style. This also includes a few
trivial cleanups elsewhere.

I also missed restyling the "complete" module when working my way from a to z
so this final change includes restyling that module.

Total lint errors decreased 36%. Cppcheck errors went from 47 to 24. Oclint P2
errors went from 819 to 778. Oclint P3 errors went from 3252 to 1842.

Resolves #2902.

											
										
										
											2016-05-04 07:23:30 +08:00
+								        case VARIABLE_EXPAND_EMPTY: {
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								            return ERROR_NOT_PID;
-												restyle switch blocks to match project style

I missed restyling a few "switch" blocks to make them consistent with the rest
of the code base. This fixes that oversight. This should be the final step in
restyling the C++ code to have a consistent style. This also includes a few
trivial cleanups elsewhere.

I also missed restyling the "complete" module when working my way from a to z
so this final change includes restyling that module.

Total lint errors decreased 36%. Cppcheck errors went from 47 to 24. Oclint P2
errors went from 819 to 778. Oclint P3 errors went from 3252 to 1842.

Resolves #2902.

											
										
										
											2016-05-04 07:23:30 +08:00
+								        }
-												Reformat all files

This runs build_tools/style.fish, which runs clang-format on C++, fish_indent on fish and (new) black on python.

If anything is wrong with the formatting, we should fix the tools, but automated formatting is worth it.

											
										
										
											2019-05-05 18:09:25 +08:00
+								        default: {
 								            return ERROR_BAD_VAR_CHAR1;
 								        }
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								    }
 								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								void parse_util_expand_variable_error(const wcstring &token, size_t global_token_pos,
 								                                      size_t dollar_pos, parse_error_list_t *errors) {
 								    // Note that dollar_pos is probably VARIABLE_EXPAND or VARIABLE_EXPAND_SINGLE, not a literal
 								    // dollar sign.
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								    assert(errors != nullptr);
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								    assert(dollar_pos < token.size());
-												eliminate "useless parentheses" lint errors

Some `oclint` errors regarding "useless parentheses" are meaningfull. But
the vast majority are bogus in as much as removing the parentheses reduces
readability. So fix a few of the egregious uses and otherwise suppress
that error.

											
										
										
											2016-05-04 12:31:32 +08:00
+								    const bool double_quotes = token.at(dollar_pos) == VARIABLE_EXPAND_SINGLE;
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								    const size_t start_error_count = errors->size();
 								    const size_t global_dollar_pos = global_token_pos + dollar_pos;
 								    const size_t global_after_dollar_pos = global_dollar_pos + 1;
-												fixes for cppcheck lint warnings

Refine the linting behavior.

Fix several of the, mostly trivial, lint errors.

											
										
										
											2016-04-05 05:34:28 +08:00
+								    wchar_t char_after_dollar = dollar_pos + 1 >= token.size() ? 0 : token.at(dollar_pos + 1);
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    switch (char_after_dollar) {
-												Rename BRACKET in reference to `{` to BRACE instead per #3802

This `{` is a curly brace. This `[` is a square bracket.

											
										
										
											2018-03-11 03:16:07 +08:00
+								        case BRACE_BEGIN:
-												fix minor style nits

While investigating issue #3634 I noticed some inconsistent whitespace
that this cleans up.

											
										
										
											2016-12-13 04:35:22 +08:00
+								        case L'{': {
-												Rename BRACKET in reference to `{` to BRACE instead per #3802

This `{` is a curly brace. This `[` is a square bracket.

											
										
										
											2018-03-11 03:16:07 +08:00
+								            // The BRACE_BEGIN is for unquoted, the { is for quoted. Anyways we have (possible
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            // quoted) ${. See if we have a }, and the stuff in between is variable material. If so,
 								            // report a bracket error. Otherwise just complain about the ${.
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								            bool looks_like_variable = false;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            size_t closing_bracket =
-												Rename BRACKET in reference to `{` to BRACE instead per #3802

This `{` is a curly brace. This `[` is a square bracket.

											
										
										
											2018-03-11 03:16:07 +08:00
+								                token.find(char_after_dollar == L'{' ? L'}' : wchar_t(BRACE_END), dollar_pos + 2);
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								            wcstring var_name;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            if (closing_bracket != wcstring::npos) {
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								                size_t var_start = dollar_pos + 2, var_end = closing_bracket;
 								                var_name = wcstring(token, var_start, var_end - var_start);
-												simplify and clarify valid identifiers

This is the first step in addressing issue #3965. It renames some of the
functions involved in validating variable and function names to clarify
their purpose. It also augments the documentation to make the rules for
such identifiers clearly documented.

											
										
										
											2017-04-20 14:43:02 +08:00
+								                looks_like_variable = valid_var_name(var_name);
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
+								            }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            if (looks_like_variable) {
 								                append_syntax_error(
 								                    errors, global_after_dollar_pos,
 								                    double_quotes ? ERROR_BRACKETED_VARIABLE_QUOTED1 : ERROR_BRACKETED_VARIABLE1,
-												parse_util.cpp: remove truncate_string()

We already have something that does this

											
										
										
											2019-09-20 01:32:07 +08:00
+								                    truncate(var_name, var_err_len).c_str());
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            } else {
 								                append_syntax_error(errors, global_after_dollar_pos, ERROR_BAD_VAR_CHAR1, L'{');
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
+								            }
 								            break;
 								        }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        case INTERNAL_SEPARATOR: {
 								            // e.g.: echo foo"$"baz
 								            // These are only ever quotes, not command substitutions. Command substitutions are
 								            // handled earlier.
 								            append_syntax_error(errors, global_dollar_pos, ERROR_NO_VAR_NAME);
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
+								            break;
 								        }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        case '(': {
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								            // e.g.: 'echo "foo$(bar)baz"
 								            // Try to determine what's in the parens.
 								            wcstring token_after_parens;
 								            wcstring paren_text;
 								            size_t open_parens = dollar_pos + 1, cmdsub_start = 0, cmdsub_end = 0;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            if (parse_util_locate_cmdsubst_range(token, &open_parens, &paren_text, &cmdsub_start,
 								                                                 &cmdsub_end, true) > 0) {
-												Continue to refine tokenizer interface

Migrate some functions into tokenizer instance methods

											
										
										
											2015-07-26 15:58:32 +08:00
+								                token_after_parens = tok_first(paren_text);
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								            }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
 								            // Make sure we always show something.
 								            if (token_after_parens.empty()) {
-												Ellipsis OCD

											
										
										
											2019-09-20 02:09:37 +08:00
+								                token_after_parens = get_ellipsis_str();
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								            }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
 								            append_syntax_error(errors, global_dollar_pos, ERROR_BAD_VAR_SUBCOMMAND1,
-												parse_util.cpp: remove truncate_string()

We already have something that does this

											
										
										
											2019-09-20 01:32:07 +08:00
+								                                truncate(token_after_parens, var_err_len).c_str());
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								            break;
 								        }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        case L'\0': {
 								            append_syntax_error(errors, global_dollar_pos, ERROR_NO_VAR_NAME);
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
+								            break;
 								        }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        default: {
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								            wchar_t token_stop_char = char_after_dollar;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            // Unescape (see issue #50).
-												Feature flag support for ? wildcard

This partially reverts 6e56637cf0a6036fdea4105e9f33314a3d6e8e78 and #4520
by bringing back the ? wildcard, guarded by the qmark-noglob feature flag.

											
										
										
											2018-05-06 10:11:57 +08:00
+								            if (token_stop_char == ANY_CHAR)
 								                token_stop_char = L'?';
 								            else if (token_stop_char == ANY_STRING || token_stop_char == ANY_STRING_RECURSIVE)
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
+								                token_stop_char = L'*';
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
 								            // Determine which error message to use. The format string may not consume all the
 								            // arguments we pass but that's harmless.
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								            const wchar_t *error_fmt = error_format_for_character(token_stop_char);
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
 								            append_syntax_error(errors, global_after_dollar_pos, error_fmt, token_stop_char);
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
+								            break;
 								        }
 								    }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
 								    // We should have appended exactly one error.
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								    assert(errors->size() == start_error_count + 1);
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
+								}
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								/// Detect cases like $(abc). Given an arg like foo(bar), let arg_src be foo and cmdsubst_src be
 								/// bar. If arg ends with VARIABLE_EXPAND, then report an error.
 								static parser_test_error_bits_t detect_dollar_cmdsub_errors(size_t arg_src_offset,
 								                                                            const wcstring &arg_src,
 								                                                            const wcstring &cmdsubst_src,
 								                                                            parse_error_list_t *out_errors) {
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								    parser_test_error_bits_t result_bits = 0;
 								    wcstring unescaped_arg_src;
-												lint: Use early exit/continue

											
										
										
											2016-10-31 12:05:27 +08:00
 								    if (!unescape_string(arg_src, &unescaped_arg_src, UNESCAPE_SPECIAL) ||
 								        unescaped_arg_src.empty()) {
 								        return result_bits;
 								    }
 								    wchar_t last = unescaped_arg_src.at(unescaped_arg_src.size() - 1);
 								    if (last == VARIABLE_EXPAND) {
 								        result_bits |= PARSER_TEST_ERROR;
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								        if (out_errors != nullptr) {
-												lint: Use early exit/continue

											
										
										
											2016-10-31 12:05:27 +08:00
+								            wcstring subcommand_first_token = tok_first(cmdsubst_src);
 								            if (subcommand_first_token.empty()) {
 								                // e.g. $(). Report somthing.
-												Ellipsis OCD

											
										
										
											2019-09-20 02:09:37 +08:00
+								                subcommand_first_token = get_ellipsis_str();
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								            }
-												lint: Use early exit/continue

											
										
										
											2016-10-31 12:05:27 +08:00
+								            append_syntax_error(
 								                out_errors,
 								                arg_src_offset + arg_src.size() - 1,  // global position of the dollar
-												parse_util.cpp: remove truncate_string()

We already have something that does this

											
										
										
											2019-09-20 01:32:07 +08:00
+								                ERROR_BAD_VAR_SUBCOMMAND1, truncate(subcommand_first_token, var_err_len).c_str());
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								        }
 								    }
-												lint: Use early exit/continue

											
										
										
											2016-10-31 12:05:27 +08:00
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								    return result_bits;
 								}
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								/// Test if this argument contains any errors. Detected errors include syntax errors in command
 								/// substitutions, improperly escaped characters and improper use of the variable expansion
 								/// operator.
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								parser_test_error_bits_t parse_util_detect_errors_in_argument(const ast::argument_t &arg,
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								                                                              const wcstring &arg_src,
 								                                                              parse_error_list_t *out_errors) {
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								    maybe_t<source_range_t> source_range = arg.try_source_range();
 								    if (!source_range.has_value()) return 0;
 								    size_t source_start = source_range->start;
-												More clean up of parse_util_detect_errors_in_argument

											
										
										
											2020-07-15 06:51:12 +08:00
+								    parser_test_error_bits_t err = 0;
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
-												More clean up of parse_util_detect_errors_in_argument

											
										
										
											2020-07-15 06:51:12 +08:00
+								    size_t cursor = 0;
 								    wcstring subst;
 								    bool do_loop = true;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    while (do_loop) {
-												Use parse_util_locate_cmdsubst_range when validating arguments

Removes another usage of parse_util_locate_cmdsubst().

											
										
										
											2020-07-15 06:34:26 +08:00
+								        size_t paren_begin = 0;
 								        size_t paren_end = 0;
-												More clean up of parse_util_detect_errors_in_argument

											
										
										
											2020-07-15 06:51:12 +08:00
+								        switch (parse_util_locate_cmdsubst_range(arg_src, &cursor, &subst, &paren_begin, &paren_end,
 								                                                 false)) {
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            case -1: {
-												More clean up of parse_util_detect_errors_in_argument

											
										
										
											2020-07-15 06:51:12 +08:00
+								                err |= PARSER_TEST_ERROR;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								                if (out_errors) {
-												Migrate parse_util_detect_errors_in_argument to tnode_t

											
										
										
											2018-01-13 03:36:45 +08:00
+								                    append_syntax_error(out_errors, source_start, L"Mismatched parenthesis");
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
+								                }
 								                return err;
 								            }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            case 0: {
-												More clean up of parse_util_detect_errors_in_argument

											
										
										
											2020-07-15 06:51:12 +08:00
+								                do_loop = false;
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
+								                break;
 								            }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								            case 1: {
-												Use parse_util_locate_cmdsubst_range when validating arguments

Removes another usage of parse_util_locate_cmdsubst().

											
										
										
											2020-07-15 06:34:26 +08:00
+								                assert(paren_begin < paren_end && "Parens out of order?");
-												Rewrite parser_t::test_args and parser_t::eval_args to use new parser

											
										
										
											2014-03-19 05:14:32 +08:00
+								                parse_error_list_t subst_errors;
-												Reduce copying in parse_util_detect_errors

Allow parse_util_detect_errors to accept an already-parsed ast. This
eliminates a copy of the source, which is helpful when executing large
scripts.

											
										
										
											2020-07-13 04:55:51 +08:00
+								                err |= parse_util_detect_errors(subst, &subst_errors);
-												Rewrite parser_t::test_args and parser_t::eval_args to use new parser

											
										
										
											2014-03-19 05:14:32 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								                // Our command substitution produced error offsets relative to its source. Tweak the
 								                // offsets of the errors in the command substitution to account for both its offset
 								                // within the string, and the offset of the node.
-												Use parse_util_locate_cmdsubst_range when validating arguments

Removes another usage of parse_util_locate_cmdsubst().

											
										
										
											2020-07-15 06:34:26 +08:00
+								                size_t error_offset = paren_begin + 1 + source_start;
-												Excise use of parser_t's error() functionality. Thread a
parse_error_list_t through all of the expand functions, enabling them to
report errors more directly. Improve aspects of error reporting for
expansion failures.

											
										
										
											2014-03-22 08:13:33 +08:00
+								                parse_error_offset_source_start(&subst_errors, error_offset);
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
-												[clang-tidy] Replace NULL with nullptr

Found with modernize-use-nullptr

Signed-off-by: Rosen Penev <rosenp@gmail.com>

											
										
										
											2019-11-19 10:34:50 +08:00
+								                if (out_errors != nullptr) {
-												Rewrite parser_t::test_args and parser_t::eval_args to use new parser

											
										
										
											2014-03-19 05:14:32 +08:00
+								                    out_errors->insert(out_errors->end(), subst_errors.begin(), subst_errors.end());
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
 								                    // Hackish. Take this opportunity to report $(...) errors. We do this because
 								                    // after we've replaced with internal separators, we can't distinguish between
 								                    // "" and (), and also we no longer have the source of the command substitution.
 								                    // As an optimization, this is only necessary if the last character is a $.
-												More clean up of parse_util_detect_errors_in_argument

											
										
										
											2020-07-15 06:51:12 +08:00
+								                    if (paren_begin > 0 && arg_src.at(paren_begin - 1) == L'$') {
-												Migrate parse_util_detect_errors_in_argument to tnode_t

											
										
										
											2018-01-13 03:36:45 +08:00
+								                        err |= detect_dollar_cmdsub_errors(
-												More clean up of parse_util_detect_errors_in_argument

											
										
										
											2020-07-15 06:51:12 +08:00
+								                            source_start, arg_src.substr(0, paren_begin), subst, out_errors);
-												Rework error messages to be shorter and to handle more special bash-isms

Example: we can point $* to argv

Fixes #1288

											
										
										
											2015-04-30 07:53:02 +08:00
+								                    }
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
+								                }
 								                break;
 								            }
-												lint: missing default in switch statements

											
										
										
											2016-10-30 08:25:48 +08:00
+								            default: {
 								                DIE("unexpected parse_util_locate_cmdsubst() return value");
 								            }
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
+								        }
 								    }
 								    wcstring unesc;
-												More clean up of parse_util_detect_errors_in_argument

											
										
										
											2020-07-15 06:51:12 +08:00
+								    if (!unescape_string(arg_src, &unesc, UNESCAPE_SPECIAL)) {
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								        if (out_errors) {
-												More clean up of parse_util_detect_errors_in_argument

											
										
										
											2020-07-15 06:51:12 +08:00
+								            append_syntax_error(out_errors, source_start, L"Invalid token '%ls'", arg_src.c_str());
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
+								        }
 								        return 1;
-												lint cleanup: eliminate "redundant" errors

This removes some pointless parentheses but the primary focus is removing
redundancies like unnecessary "else" clauses.

											
										
										
											2016-05-05 06:19:47 +08:00
+								    }
 								    // Check for invalid variable expansions.
 								    const size_t unesc_size = unesc.size();
 								    for (size_t idx = 0; idx < unesc_size; idx++) {
-												lint: Use early exit/continue

											
										
										
											2016-10-31 12:05:27 +08:00
+								        if (unesc.at(idx) != VARIABLE_EXPAND && unesc.at(idx) != VARIABLE_EXPAND_SINGLE) {
 								            continue;
 								        }
-												lint: too few branches in switch statement

Someone was way too enamored of the `switch` statement. Using it in
places where a simple `if...else if...else` was clearer and shorter.

											
										
										
											2016-10-23 11:32:25 +08:00
-												lint: Use early exit/continue

											
										
										
											2016-10-31 12:05:27 +08:00
+								        wchar_t next_char = idx + 1 < unesc_size ? unesc.at(idx + 1) : L'\0';
 								        if (next_char != VARIABLE_EXPAND && next_char != VARIABLE_EXPAND_SINGLE &&
-												simplify and clarify valid identifiers

This is the first step in addressing issue #3965. It renames some of the
functions involved in validating variable and function names to clarify
their purpose. It also augments the documentation to make the rules for
such identifiers clearly documented.

											
										
										
											2017-04-20 14:43:02 +08:00
+								            !valid_var_name_char(next_char)) {
-												lint: Use early exit/continue

											
										
										
											2016-10-31 12:05:27 +08:00
+								            err = 1;
 								            if (out_errors) {
 								                // We have something like $$$^....  Back up until we reach the first $.
 								                size_t first_dollar = idx;
-												time for another `make style-all`

											
										
										
											2016-12-04 12:12:53 +08:00
+								                while (first_dollar > 0 && (unesc.at(first_dollar - 1) == VARIABLE_EXPAND ||
 								                                            unesc.at(first_dollar - 1) == VARIABLE_EXPAND_SINGLE)) {
-												lint: Use early exit/continue

											
										
										
											2016-10-31 12:05:27 +08:00
+								                    first_dollar--;
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
+								                }
-												Migrate parse_util_detect_errors_in_argument to tnode_t

											
										
										
											2018-01-13 03:36:45 +08:00
+								                parse_util_expand_variable_error(unesc, source_start, first_dollar, out_errors);
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
+								            }
 								        }
 								    }
 								    return err;
 								}
-												Adopt tnode_t in parse_util_detect_errors

											
										
										
											2018-01-13 03:15:35 +08:00
+								/// Given that the job given by node should be backgrounded, return true if we detect any errors.
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								static bool detect_errors_in_backgrounded_job(const ast::job_t &job,
-												Adopt tnode_t in parse_util_detect_errors

											
										
										
											2018-01-13 03:15:35 +08:00
+								                                              parse_error_list_t *parse_errors) {
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								    using namespace ast;
 								    auto source_range = job.try_source_range();
-												Adopt tnode_t in detect_errors_in_backgrounded_job

											
										
										
											2018-01-14 08:24:21 +08:00
+								    if (!source_range) return false;
-												Adopt tnode_t in parse_util_detect_errors

											
										
										
											2018-01-13 03:15:35 +08:00
+								    bool errored = false;
 								    // Disallow background in the following cases:
 								    // foo & ; and bar
 								    // foo & ; or bar
 								    // if foo & ; end
 								    // while foo & ; end
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								    const job_conjunction_t *job_conj = job.parent->try_as<job_conjunction_t>();
 								    if (!job_conj) return false;
 								    if (job_conj->parent->try_as<if_clause_t>()) {
-												Adopt tnode_t in detect_errors_in_backgrounded_job

											
										
										
											2018-01-14 08:24:21 +08:00
+								        errored = append_syntax_error(parse_errors, source_range->start,
 								                                      BACKGROUND_IN_CONDITIONAL_ERROR_MSG);
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								    } else if (job_conj->parent->try_as<while_header_t>()) {
-												Adopt tnode_t in detect_errors_in_backgrounded_job

											
										
										
											2018-01-14 08:24:21 +08:00
+								        errored = append_syntax_error(parse_errors, source_range->start,
 								                                      BACKGROUND_IN_CONDITIONAL_ERROR_MSG);
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								    } else if (const ast::job_list_t *jlist = job_conj->parent->try_as<ast::job_list_t>()) {
-												Adopt tnode_t in detect_errors_in_backgrounded_job

											
										
										
											2018-01-14 08:24:21 +08:00
+								        // This isn't very complete, e.g. we don't catch 'foo & ; not and bar'.
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								        // Find the index of ourselves in the job list.
 								        size_t index;
 								        for (index = 0; index < jlist->count(); index++) {
 								            if (jlist->at(index) == job_conj) break;
 								        }
 								        assert(index < jlist->count() && "Should have found the job in the list");
 								        // Try getting the next job and check its decorator.
 								        if (const job_conjunction_t *next = jlist->at(index + 1)) {
 								            if (const keyword_base_t *deco = next->decorator.contents.get()) {
 								                assert(
 								                    (deco->kw == parse_keyword_t::kw_and || deco->kw == parse_keyword_t::kw_or) &&
 								                    "Unexpected decorator keyword");
 								                const wchar_t *deco_name = (deco->kw == parse_keyword_t::kw_and ? L"and" : L"or");
 								                errored = append_syntax_error(parse_errors, deco->source_range().start,
 								                                              BOOL_AFTER_BACKGROUND_ERROR_MSG, deco_name);
-												Adopt tnode_t in parse_util_detect_errors

											
										
										
											2018-01-13 03:15:35 +08:00
+								            }
 								        }
 								    }
 								    return errored;
 								}
-												Reduce allocation churn in parse_util_detect_errors

Reuse a single string for storage.

											
										
										
											2020-07-13 03:51:17 +08:00
+								/// Given a source buffer \p buff_src and decorated statement \p dst within it, return true if there
 								/// is an error and false if not. \p storage may be used to reduce allocations.
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								static bool detect_errors_in_decorated_statement(const wcstring &buff_src,
 								                                                 const ast::decorated_statement_t &dst,
-												Reduce allocation churn in parse_util_detect_errors

Reuse a single string for storage.

											
										
										
											2020-07-13 03:51:17 +08:00
+								                                                 wcstring *storage,
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								                                                 parse_error_list_t *parse_errors) {
 								    using namespace ast;
-												Factor out plain statement case of parse_util_detect_errors

Factors out a lot of code into a separate function.

											
										
										
											2018-02-19 05:00:46 +08:00
+								    bool errored = false;
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								    auto source_start = dst.source_range().start;
-												Make parse_statement_decoration_t a class enum

											
										
										
											2020-07-08 07:28:39 +08:00
+								    const statement_decoration_t decoration = dst.decoration();
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
 								    // Determine if the first argument is help.
 								    bool first_arg_is_help = false;
 								    if (const auto *arg = get_first_arg(dst.args_or_redirs)) {
-												Reduce allocation churn in parse_util_detect_errors

Reuse a single string for storage.

											
										
										
											2020-07-13 03:51:17 +08:00
+								        const wcstring &arg_src = arg->source(buff_src, storage);
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								        first_arg_is_help = parse_util_argument_is_help(arg_src.c_str());
 								    }
-												Factor out plain statement case of parse_util_detect_errors

Factors out a lot of code into a separate function.

											
										
										
											2018-02-19 05:00:46 +08:00
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								    // Get the statement we are part of.
 								    const statement_t *st = dst.parent->as<statement_t>();
-												Factor out plain statement case of parse_util_detect_errors

Factors out a lot of code into a separate function.

											
										
										
											2018-02-19 05:00:46 +08:00
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								    // Walk up to the job.
 								    const ast::job_t *job = nullptr;
 								    for (const node_t *cursor = st; job == nullptr; cursor = cursor->parent) {
 								        assert(cursor && "Reached root without finding a job");
 								        job = cursor->try_as<ast::job_t>();
 								    }
 								    assert(job && "Should have found the job");
 								    // Check our pipeline position.
 								    pipeline_position_t pipe_pos;
 								    if (job->continuation.empty()) {
 								        pipe_pos = pipeline_position_t::none;
 								    } else if (&job->statement == st) {
 								        pipe_pos = pipeline_position_t::first;
 								    } else {
 								        pipe_pos = pipeline_position_t::subsequent;
 								    }
-												Factor out plain statement case of parse_util_detect_errors

Factors out a lot of code into a separate function.

											
										
										
											2018-02-19 05:00:46 +08:00
 								    // Check that we don't try to pipe through exec.
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								    bool is_in_pipeline = (pipe_pos != pipeline_position_t::none);
-												Make parse_statement_decoration_t a class enum

											
										
										
											2020-07-08 07:28:39 +08:00
+								    if (is_in_pipeline && decoration == statement_decoration_t::exec) {
-												Factor out plain statement case of parse_util_detect_errors

Factors out a lot of code into a separate function.

											
										
										
											2018-02-19 05:00:46 +08:00
+								        errored = append_syntax_error(parse_errors, source_start, EXEC_ERR_MSG, L"exec");
 								    }
-												Rework 'and' and 'or' to be "job decorators"

This promotes "and" and "or" from a type of statement to "job
decorators," as a possible prefix on a job. The point is to rationalize
how they interact with && and ||.

In the new world 'and' and 'or' apply to an entire job conjunction, i.e.
they have "lower precedence." Example:

if [ $age -ge 0 ] && [ $age -le 18 ]
   or [ $age -ge 75 ] && [ $age -le 100 ]
   echo "Child or senior"
end

											
										
										
											2018-03-03 10:09:16 +08:00
+								    // This is a somewhat stale check that 'and' and 'or' are not in pipelines, except at the
 								    // beginning. We can't disallow them as commands entirely because we need to support 'and
 								    // --help', etc.
 								    if (pipe_pos == pipeline_position_t::subsequent) {
 								        // check if our command is 'and' or 'or'. This is very clumsy; we don't catch e.g. quoted
 								        // commands.
-												Reduce allocation churn in parse_util_detect_errors

Reuse a single string for storage.

											
										
										
											2020-07-13 03:51:17 +08:00
+								        const wcstring &command = dst.command.source(buff_src, storage);
-												Rework 'and' and 'or' to be "job decorators"

This promotes "and" and "or" from a type of statement to "job
decorators," as a possible prefix on a job. The point is to rationalize
how they interact with && and ||.

In the new world 'and' and 'or' apply to an entire job conjunction, i.e.
they have "lower precedence." Example:

if [ $age -ge 0 ] && [ $age -le 18 ]
   or [ $age -ge 75 ] && [ $age -le 100 ]
   echo "Child or senior"
end

											
										
										
											2018-03-03 10:09:16 +08:00
+								        if (command == L"and" || command == L"or") {
 								            errored =
 								                append_syntax_error(parse_errors, source_start, EXEC_ERR_MSG, command.c_str());
 								        }
 								    }
-												Reduce allocation churn in parse_util_detect_errors

Reuse a single string for storage.

											
										
										
											2020-07-13 03:51:17 +08:00
+								    const wcstring &unexp_command = dst.command.source(buff_src, storage);
 								    if (!unexp_command.empty()) {
-												Allow variables in commands

Syntax highlighting for these coming in next commit.

Fixes #154

											
										
										
											2018-08-26 16:41:45 +08:00
+								        wcstring command;
-												Factor our plain statement case of parse_util_detect_errors

Factors out a lot of code into a separate function.

											
										
										
											2018-02-19 05:00:46 +08:00
+								        // Check that we can expand the command.
-												Reduce allocation churn in parse_util_detect_errors

Reuse a single string for storage.

											
										
										
											2020-07-13 03:51:17 +08:00
+								        if (expand_to_command_and_args(unexp_command, operation_context_t::empty(), &command,
-												Stop expanding globs in command position when performing error checking

Before running a command, or before importing a command from bash history,
we perform error checking. As part of error checking we expand commands
including variables and globs. If the glob is very large, like `/**`, then
we could hang expanding it.

One fix would be to limit the amount of expansion from the glob, but
instead let's just not expand command globs when performing error checking.

Fixes #7407

											
										
										
											2020-12-21 05:36:12 +08:00
+								                                       nullptr, parse_errors,
 								                                       true /* skip wildcards */) == expand_result_t::error) {
-												Allow variables in commands

Syntax highlighting for these coming in next commit.

Fixes #154

											
										
										
											2018-08-26 16:41:45 +08:00
+								            errored = true;
-												fix incorrectly aligned caret in command expansion errors and more

- fix the caret position expanding e.g. `command $,`
- improve the error reporting for not-allowed command substitutions
  by figuring out where the expansion failed instead of using
  SOURCE_LOCATION_UNKNOWN
- allow nullptr for parse_util_locate_brackets_range() out_string
  argument if we don't need it to do any work.

Fixes #5812

											
										
										
											2019-04-12 05:28:27 +08:00
+								            parse_error_offset_source_start(parse_errors, source_start);
-												Factor our plain statement case of parse_util_detect_errors

Factors out a lot of code into a separate function.

											
										
										
											2018-02-19 05:00:46 +08:00
+								        }
 								        // Check that pipes are sound.
 								        if (!errored && parser_is_pipe_forbidden(command) && is_in_pipeline) {
 								            errored =
 								                append_syntax_error(parse_errors, source_start, EXEC_ERR_MSG, command.c_str());
 								        }
 								        // Check that we don't return from outside a function. But we allow it if it's
 								        // 'return --help'.
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								        if (!errored && command == L"return" && !first_arg_is_help) {
 								            // See if we are in a function.
-												Factor our plain statement case of parse_util_detect_errors

Factors out a lot of code into a separate function.

											
										
										
											2018-02-19 05:00:46 +08:00
+								            bool found_function = false;
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								            for (const node_t *cursor = &dst; cursor != nullptr; cursor = cursor->parent) {
 								                if (const auto *bs = cursor->try_as<block_statement_t>()) {
 								                    if (bs->header->type == type_t::function_header) {
 								                        found_function = true;
 								                        break;
 								                    }
-												Factor our plain statement case of parse_util_detect_errors

Factors out a lot of code into a separate function.

											
										
										
											2018-02-19 05:00:46 +08:00
+								                }
 								            }
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
 								            if (!found_function) {
-												Factor our plain statement case of parse_util_detect_errors

Factors out a lot of code into a separate function.

											
										
										
											2018-02-19 05:00:46 +08:00
+								                errored = append_syntax_error(parse_errors, source_start, INVALID_RETURN_ERR_MSG);
 								            }
 								        }
 								        // Check that we don't break or continue from outside a loop.
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								        if (!errored && (command == L"break" || command == L"continue") && !first_arg_is_help) {
-												Factor our plain statement case of parse_util_detect_errors

Factors out a lot of code into a separate function.

											
										
										
											2018-02-19 05:00:46 +08:00
+								            // Walk up until we hit a 'for' or 'while' loop. If we hit a function first,
 								            // stop the search; we can't break an outer loop from inside a function.
 								            // This is a little funny because we can't tell if it's a 'for' or 'while'
 								            // loop from the ancestor alone; we need the header. That is, we hit a
 								            // block_statement, and have to check its header.
 								            bool found_loop = false;
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								            for (const node_t *ancestor = &dst; ancestor != nullptr; ancestor = ancestor->parent) {
 								                const auto *block = ancestor->try_as<block_statement_t>();
 								                if (!block) continue;
 								                if (block->header->type == type_t::for_header ||
 								                    block->header->type == type_t::while_header) {
-												Factor our plain statement case of parse_util_detect_errors

Factors out a lot of code into a separate function.

											
										
										
											2018-02-19 05:00:46 +08:00
+								                    // This is a loop header, so we can break or continue.
 								                    found_loop = true;
 								                    break;
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								                } else if (block->header->type == type_t::function_header) {
-												Factor our plain statement case of parse_util_detect_errors

Factors out a lot of code into a separate function.

											
										
										
											2018-02-19 05:00:46 +08:00
+								                    // This is a function header, so we cannot break or
 								                    // continue. We stop our search here.
 								                    found_loop = false;
 								                    break;
 								                }
 								            }
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								            if (!found_loop) {
-												Factor our plain statement case of parse_util_detect_errors

Factors out a lot of code into a separate function.

											
										
										
											2018-02-19 05:00:46 +08:00
+								                errored = append_syntax_error(
 								                    parse_errors, source_start,
 								                    (command == L"break" ? INVALID_BREAK_ERR_MSG : INVALID_CONTINUE_ERR_MSG));
 								            }
 								        }
 								        // Check that we don't do an invalid builtin (issue #1252).
-												Reduce allocation churn in parse_util_detect_errors

Reuse a single string for storage.

											
										
										
											2020-07-13 03:51:17 +08:00
+								        if (!errored && decoration == statement_decoration_t::builtin) {
 								            wcstring command = unexp_command;
 								            if (expand_one(command, expand_flag::skip_cmdsubst, operation_context_t::empty(),
 								                           parse_errors) &&
 								                !builtin_exists(unexp_command)) {
 								                errored = append_syntax_error(parse_errors, source_start, UNKNOWN_BUILTIN_ERR_MSG,
 								                                              unexp_command.c_str());
 								            }
-												Factor our plain statement case of parse_util_detect_errors

Factors out a lot of code into a separate function.

											
										
										
											2018-02-19 05:00:46 +08:00
+								        }
 								    }
 								    return errored;
 								}
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								// Given we have a trailing argument_or_redirection_list, like `begin; end > /dev/null`, verify that
 								// there are no arguments in the list.
 								// Only redirections may trail a block's 'end'. If an argument is present, a syntax error using
 								// END_ARG_ERR_MSG is appended at that argument's source start and the result of
 								// append_syntax_error is returned; otherwise this returns false.
 								static bool detect_errors_in_block_redirection_list(
 								    const ast::argument_or_redirection_list_t &args_or_redirs, parse_error_list_t *out_errors) {
 								    if (const auto *first_arg = get_first_arg(args_or_redirs)) {
 								        // Report the 'end'-specific message; this check is unrelated to backgrounded jobs.
 								        return append_syntax_error(out_errors, first_arg->source_range().start,
 								                                   END_ARG_ERR_MSG);
 								    }
 								    return false;
 								}
-												Reduce copying in parse_util_detect_errors

Allow parse_util_detect_errors to accept an already-parsed ast. This
eliminates a copy of the source, which is helpful when executing large
scripts.

											
										
										
											2020-07-13 04:55:51 +08:00
+								parser_test_error_bits_t parse_util_detect_errors(const ast::ast_t &ast, const wcstring &buff_src,
 								                                                  parse_error_list_t *out_errors) {
 								    using namespace ast;
-												Support for error detection in arguments in new parser. Restores error
reporting for bad arguments (e.g. with bad variable names)

											
										
										
											2014-03-04 18:53:34 +08:00
+								    parser_test_error_bits_t res = 0;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    // Whether we encountered a parse error.
-												Initial work on backtrace support with new parser

											
										
										
											2013-12-16 08:05:37 +08:00
+								    bool errored = false;
-												Update style and formatting to conform to fish style guide.

											
										
										
											2014-01-15 17:40:40 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    // Whether we encountered an unclosed block. We detect this via an 'end_command' block without
 								    // source.
-												Initial work on backtrace support with new parser

											
										
										
											2013-12-16 08:05:37 +08:00
+								    bool has_unclosed_block = false;
-												Update style and formatting to conform to fish style guide.

											
										
										
											2014-01-15 17:40:40 +08:00
-												Teach parse_util_detect_errors about unterminated pipelines

Allow it to return PARSER_TEST_INCOMPLETE for code like
`echo | `

											
										
										
											2018-02-19 05:13:58 +08:00
+								    // Whether we encounter a missing statement, i.e. a newline after a pipe. This is found by
 								    // detecting job_continuations that have source for pipes but not the statement.
 								    bool has_unclosed_pipe = false;
-												Allow newlines after && and ||

We do the same for pipes (#1285). This matches POSIX sh behavior.

											
										
										
											2020-08-05 03:39:37 +08:00
+								    // Whether we encounter a missing job, i.e. a newline after && or ||. This is found by
 								    // detecting job_conjunction_continuations that have source for && or || but not the job.
 								    bool has_unclosed_conjunction = false;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    // Expand all commands.
 								    // Verify 'or' and 'and' not used inside pipelines.
 								    // Verify pipes via parser_is_pipe_forbidden.
 								    // Verify return only within a function.
 								    // Verify no variable expansions.
-												Reduce allocation churn in parse_util_detect_errors

Reuse a single string for storage.

											
										
										
											2020-07-13 03:51:17 +08:00
+								    wcstring storage;
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
-												Reformat CPP files

											
										
										
											2020-08-05 03:41:14 +08:00
+								    for (const node_t &node : ast) {
 								        if (const job_continuation_t *jc = node.try_as<job_continuation_t>()) {
 								            // Somewhat clumsy way of checking for a statement without source in a pipeline.
 								            // See if our pipe has source but our statement does not.
 								            if (!jc->pipe.unsourced && !jc->statement.try_source_range().has_value()) {
 								                has_unclosed_pipe = true;
-												Initial work on backtrace support with new parser

											
										
										
											2013-12-16 08:05:37 +08:00
+								            }
-												Allow newlines after && and ||

We do the same for pipes (#1285). This matches POSIX sh behavior.

											
										
										
											2020-08-05 03:39:37 +08:00
+								        } else if (const auto *jcc = node.try_as<job_conjunction_continuation_t>()) {
 								            // Somewhat clumsy way of checking for a job without source in a conjunction.
 								            // See if our conjunction operator (&& or ||) has source but our job does not.
 								            if (!jcc->conjunction.unsourced && !jcc->job.try_source_range().has_value()) {
 								                has_unclosed_conjunction = true;
 								            }
-												Reformat CPP files

											
										
										
											2020-08-05 03:41:14 +08:00
+								        } else if (const argument_t *arg = node.try_as<argument_t>()) {
 								            const wcstring &arg_src = arg->source(buff_src, &storage);
 								            res |= parse_util_detect_errors_in_argument(*arg, arg_src, out_errors);
 								        } else if (const ast::job_t *job = node.try_as<ast::job_t>()) {
 								            // Disallow background in the following cases:
 								            //
 								            // foo & ; and bar
 								            // foo & ; or bar
 								            // if foo & ; end
 								            // while foo & ; end
 								            // If it's not a background job, nothing to do.
 								            if (job->bg) {
 								                errored |= detect_errors_in_backgrounded_job(*job, out_errors);
 								            }
 								        } else if (const ast::decorated_statement_t *stmt = node.try_as<decorated_statement_t>()) {
 								            errored |= detect_errors_in_decorated_statement(buff_src, *stmt, &storage, out_errors);
 								        } else if (const auto *block = node.try_as<block_statement_t>()) {
 								            // If our 'end' had no source, we are unsourced.
 								            if (block->end.unsourced) has_unclosed_block = true;
 								            errored |= detect_errors_in_block_redirection_list(block->args_or_redirs, out_errors);
 								        } else if (const auto *ifs = node.try_as<if_statement_t>()) {
 								            // If our 'end' had no source, we are unsourced.
 								            if (ifs->end.unsourced) has_unclosed_block = true;
 								            errored |= detect_errors_in_block_redirection_list(ifs->args_or_redirs, out_errors);
 								        } else if (const auto *switchs = node.try_as<switch_statement_t>()) {
 								            // If our 'end' had no source, we are unsourced.
 								            if (switchs->end.unsourced) has_unclosed_block = true;
 								            errored |= detect_errors_in_block_redirection_list(switchs->args_or_redirs, out_errors);
-												Initial work on backtrace support with new parser

											
										
										
											2013-12-16 08:05:37 +08:00
+								        }
-												Reformat CPP files

											
										
										
											2020-08-05 03:41:14 +08:00
+								    }
-												Initial work on backtrace support with new parser

											
										
										
											2013-12-16 08:05:37 +08:00
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
+								    if (errored) res |= PARSER_TEST_ERROR;
-												Initial work on backtrace support with new parser

											
										
										
											2013-12-16 08:05:37 +08:00
-												Allow newlines after && and ||

We do the same for pipes (#1285). This matches POSIX sh behavior.

											
										
										
											2020-08-05 03:39:37 +08:00
+								    if (has_unclosed_block || has_unclosed_pipe || has_unclosed_conjunction)
 								        res |= PARSER_TEST_INCOMPLETE;
-												Reduce copying in parse_util_detect_errors

Allow parse_util_detect_errors to accept an already-parsed ast. This
eliminates a copy of the source, which is helpful when executing large
scripts.

											
										
										
											2020-07-13 04:55:51 +08:00
 								    return res;
 								}
 								parser_test_error_bits_t parse_util_detect_errors(const wcstring &buff_src,
 								                                                  parse_error_list_t *out_errors,
 								                                                  bool allow_incomplete) {
 								    // Whether there's an unclosed quote or subshell, and therefore unfinished. This is only set if
 								    // allow_incomplete is set.
 								    bool has_unclosed_quote_or_subshell = false;
-												Update style and formatting to conform to fish style guide.

											
										
										
											2014-01-15 17:40:40 +08:00
-												Reduce copying in parse_util_detect_errors

Allow parse_util_detect_errors to accept an already-parsed ast. This
eliminates a copy of the source, which is helpful when executing large
scripts.

											
										
										
											2020-07-13 04:55:51 +08:00
+								    const parse_tree_flags_t parse_flags =
 								        allow_incomplete ? parse_flag_leave_unterminated : parse_flag_none;
 								    // Parse the input string into an ast. Some errors are detected here.
 								    using namespace ast;
 								    parse_error_list_t parse_errors;
 								    auto ast = ast_t::parse(buff_src, parse_flags, &parse_errors);
 								    if (allow_incomplete) {
 								        // Issue #1238: If the only error was unterminated quote, then consider this to have parsed
 								        // successfully.
 								        size_t idx = parse_errors.size();
 								        while (idx--) {
 								            if (parse_errors.at(idx).code == parse_error_tokenizer_unterminated_quote ||
 								                parse_errors.at(idx).code == parse_error_tokenizer_unterminated_subshell) {
 								                // Remove this error, since we don't consider it a real error.
 								                has_unclosed_quote_or_subshell = true;
 								                parse_errors.erase(parse_errors.begin() + idx);
 								            }
 								        }
-												Initial work on backtrace support with new parser

											
										
										
											2013-12-16 08:05:37 +08:00
+								    }
-												restyle parse_util module to match project style

Reduces lint errors from 187 to 91 (-51%). Line count from 1754 to 1477 (-16%).

Another step in resolving issue #2902.

											
										
										
											2016-05-03 07:53:10 +08:00
-												Reduce copying in parse_util_detect_errors

Allow parse_util_detect_errors to accept an already-parsed ast. This
eliminates a copy of the source, which is helpful when executing large
scripts.

											
										
										
											2020-07-13 04:55:51 +08:00
+								    // has_unclosed_quote_or_subshell may only be set if allow_incomplete is true.
 								    assert(!has_unclosed_quote_or_subshell || allow_incomplete);
 								    if (has_unclosed_quote_or_subshell) {
 								        // We do not bother to validate the rest of the tree in this case.
 								        return PARSER_TEST_INCOMPLETE;
-												Re-use the parse tree generated during error detection for execution

Prior to this fix, read_ni would use parse_util_detect_errors
to lint the script to run, and then parser_t::eval() to execute it.
Both functions would parse the script into a parse tree. This allows
us to re-use the parse tree, improving performance.

											
										
										
											2016-02-28 16:44:20 +08:00
+								    }
-												Initial work on backtrace support with new parser

											
										
										
											2013-12-16 08:05:37 +08:00
-												Reduce copying in parse_util_detect_errors

Allow parse_util_detect_errors to accept an already-parsed ast. This
eliminates a copy of the source, which is helpful when executing large
scripts.

											
										
										
											2020-07-13 04:55:51 +08:00
+								    // Early parse error, stop here.
 								    if (!parse_errors.empty()) {
 								        if (out_errors) vec_append(*out_errors, std::move(parse_errors));
 								        return PARSER_TEST_ERROR;
 								    }
 								    // Defer to the tree-walking version.
 								    return parse_util_detect_errors(ast, buff_src, out_errors);
-												Initial work on backtrace support with new parser

											
										
										
											2013-12-16 08:05:37 +08:00
+								}
-												Migrate parse_util_detect_errors to a free function

											
										
										
											2019-08-05 05:49:56 +08:00
 								maybe_t<wcstring> parse_util_detect_errors_in_argument_list(const wcstring &arg_list_src,
 								                                                            const wcstring &prefix) {
 								    // Helper to return a description of the first error.
 								    auto get_error_text = [&](const parse_error_list_t &errors) {
 								        assert(!errors.empty() && "Expected an error");
 								        return errors.at(0).describe_with_prefix(arg_list_src, prefix, false /* not interactive */,
 								                                                 false /* don't skip caret */);
 								    };
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								    // Parse the string as a freestanding argument list.
 								    using namespace ast;
-												Migrate parse_util_detect_errors to a free function

											
										
										
											2019-08-05 05:49:56 +08:00
+								    parse_error_list_t errors;
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								    auto ast = ast_t::parse_argument_list(arg_list_src, parse_flag_none, &errors);
 								    if (!errors.empty()) {
-												Migrate parse_util_detect_errors to a free function

											
										
										
											2019-08-05 05:49:56 +08:00
+								        return get_error_text(errors);
 								    }
 								    // Get the root argument list and extract arguments from it.
 								    // Test each of these.
-												Adopt the new AST in parse_util_detect_errors

This switches parse_util_detect_errors from parsing with parse_tree to
the new ast.

											
										
										
											2020-07-02 12:06:58 +08:00
+								    for (const argument_t &arg : ast.top()->as<freestanding_argument_list_t>()->arguments) {
 								        const wcstring arg_src = arg.source(arg_list_src);
-												Migrate parse_util_detect_errors to a free function

											
										
										
											2019-08-05 05:49:56 +08:00
+								        if (parse_util_detect_errors_in_argument(arg, arg_src, &errors)) {
 								            return get_error_text(errors);
 								        }
 								    }
 								    return none();
 								}