2016-04-28 07:10:14 +08:00
|
|
|
// Various functions, mostly string utilities, that are used by most parts of fish.
|
2005-10-05 17:58:00 +08:00
|
|
|
#include "config.h"
|
|
|
|
|
2015-07-25 23:14:25 +08:00
|
|
|
#include <assert.h>
|
2016-05-16 10:45:02 +08:00
|
|
|
#include <cxxabi.h>
|
|
|
|
#include <dlfcn.h>
|
2005-09-20 21:26:39 +08:00
|
|
|
#include <errno.h>
|
|
|
|
#include <limits.h>
|
2016-04-28 07:10:14 +08:00
|
|
|
#include <signal.h>
|
2012-11-19 08:30:30 +08:00
|
|
|
#include <stdarg.h>
|
2016-04-21 14:00:54 +08:00
|
|
|
#include <stddef.h>
|
2016-04-28 07:10:14 +08:00
|
|
|
#include <stdint.h>
|
|
|
|
#include <stdio.h>
|
|
|
|
#include <stdlib.h>
|
|
|
|
#include <string.h>
|
|
|
|
#include <sys/stat.h>
|
2005-09-28 09:43:09 +08:00
|
|
|
#include <sys/time.h>
|
2016-04-28 07:10:14 +08:00
|
|
|
#include <termios.h>
|
|
|
|
#include <unistd.h>
|
|
|
|
#include <wchar.h>
|
|
|
|
#include <wctype.h>
|
2007-01-20 10:36:49 +08:00
|
|
|
#ifdef HAVE_EXECINFO_H
|
|
|
|
#include <execinfo.h>
|
|
|
|
#endif
|
2016-04-28 07:10:14 +08:00
|
|
|
#ifdef HAVE_SIGINFO_H
|
|
|
|
#include <siginfo.h>
|
|
|
|
#endif
|
|
|
|
#ifdef HAVE_SYS_IOCTL_H
|
|
|
|
#include <sys/ioctl.h>
|
|
|
|
#endif
|
|
|
|
#include <algorithm>
|
|
|
|
#include <memory> // IWYU pragma: keep
|
2007-01-20 10:36:49 +08:00
|
|
|
|
2005-09-20 21:26:39 +08:00
|
|
|
#include "common.h"
|
|
|
|
#include "expand.h"
|
2016-04-28 07:10:14 +08:00
|
|
|
#include "fallback.h" // IWYU pragma: keep
|
2005-09-20 21:26:39 +08:00
|
|
|
#include "wildcard.h"
|
2016-04-28 07:10:14 +08:00
|
|
|
#include "wutil.h" // IWYU pragma: keep
|
2005-09-20 21:26:39 +08:00
|
|
|
|
2014-05-14 13:30:41 +08:00
|
|
|
#define NOT_A_WCHAR (static_cast<wint_t>(WEOF))
|
2012-03-02 16:27:40 +08:00
|
|
|
|
2012-11-19 08:30:30 +08:00
|
|
|
struct termios shell_modes;
|
2005-09-20 21:26:39 +08:00
|
|
|
|
2012-05-14 11:19:02 +08:00
|
|
|
// Note we foolishly assume that pthread_t is just a primitive. But it might be a struct.
|
2012-01-06 05:58:48 +08:00
|
|
|
static pthread_t main_thread_id = 0;
|
2012-05-14 11:19:02 +08:00
|
|
|
static bool thread_assertions_configured_for_testing = false;
|
2012-01-06 05:58:48 +08:00
|
|
|
|
2012-11-05 16:05:42 +08:00
|
|
|
wchar_t ellipsis_char;
|
2012-12-02 07:44:09 +08:00
|
|
|
wchar_t omitted_newline_char;
|
2014-02-10 06:04:43 +08:00
|
|
|
bool g_profiling_active = false;
|
2011-12-27 11:18:46 +08:00
|
|
|
const wchar_t *program_name;
|
2016-05-16 10:45:02 +08:00
|
|
|
int debug_level = 1; // default maximum debug output level (errors and warnings)
|
|
|
|
int debug_stack_frames = 0; // default number of stack frames to show on debug() calls
|
|
|
|
|
|
|
|
/// This allows us to notice when we've forked.
|
|
|
|
static pid_t initial_pid = 0;
|
2005-09-20 21:26:39 +08:00
|
|
|
|
2016-05-16 10:45:02 +08:00
|
|
|
/// Be able to restore the term's foreground process group.
|
|
|
|
static pid_t initial_foreground_process_group = -1;
|
2005-09-25 03:31:17 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
/// This struct maintains the current state of the terminal size. It is updated on demand after
|
|
|
|
/// receiving a SIGWINCH. Do not touch this struct directly, it's managed with a rwlock. Use
|
|
|
|
/// common_get_width()/common_get_height().
|
2005-10-14 19:40:33 +08:00
|
|
|
static struct winsize termsize;
|
2014-08-24 15:59:03 +08:00
|
|
|
static volatile bool termsize_valid;
|
|
|
|
static rwlock_t termsize_rwlock;
|
2005-10-14 19:40:33 +08:00
|
|
|
|
2012-12-13 07:44:01 +08:00
|
|
|
static char *wcs2str_internal(const wchar_t *in, char *out);
|
2016-05-20 10:27:22 +08:00
|
|
|
static void debug_shared(const wchar_t msg_level, const wcstring &msg);
|
2007-01-20 10:36:49 +08:00
|
|
|
|
2016-06-18 04:08:25 +08:00
|
|
|
bool has_working_tty_timestamps = true;
|
|
|
|
|
2016-05-20 10:27:22 +08:00
|
|
|
#ifdef HAVE_BACKTRACE_SYMBOLS
|
2016-05-16 10:45:02 +08:00
|
|
|
// This function produces a stack backtrace with demangled function & method names. It is based on
|
|
|
|
// https://gist.github.com/fmela/591333 but adapted to the style of the fish project.
|
|
|
|
static const wcstring_list_t __attribute__((noinline))
|
|
|
|
demangled_backtrace(int max_frames, int skip_levels) {
|
|
|
|
void *callstack[128];
|
|
|
|
const int n_max_frames = sizeof(callstack) / sizeof(callstack[0]);
|
|
|
|
int n_frames = backtrace(callstack, n_max_frames);
|
|
|
|
char **symbols = backtrace_symbols(callstack, n_frames);
|
|
|
|
wchar_t text[1024];
|
|
|
|
std::vector<wcstring> backtrace_text;
|
|
|
|
|
|
|
|
if (skip_levels + max_frames < n_frames) n_frames = skip_levels + max_frames;
|
|
|
|
|
|
|
|
for (int i = skip_levels; i < n_frames; i++) {
|
|
|
|
Dl_info info;
|
|
|
|
if (dladdr(callstack[i], &info) && info.dli_sname) {
|
|
|
|
char *demangled = NULL;
|
|
|
|
int status = -1;
|
|
|
|
if (info.dli_sname[0] == '_')
|
|
|
|
demangled = abi::__cxa_demangle(info.dli_sname, NULL, 0, &status);
|
|
|
|
swprintf(text, sizeof(text) / sizeof(wchar_t), L"%-3d %s + %td", i - skip_levels,
|
|
|
|
status == 0 ? demangled : info.dli_sname == 0 ? symbols[i] : info.dli_sname,
|
|
|
|
(char *)callstack[i] - (char *)info.dli_saddr);
|
|
|
|
free(demangled);
|
|
|
|
} else {
|
|
|
|
swprintf(text, sizeof(text) / sizeof(wchar_t), L"%-3d %s", i - skip_levels, symbols[i]);
|
|
|
|
}
|
|
|
|
backtrace_text.push_back(text);
|
|
|
|
}
|
|
|
|
free(symbols);
|
|
|
|
return backtrace_text;
|
|
|
|
}
|
|
|
|
|
2016-05-23 10:00:13 +08:00
|
|
|
void __attribute__((noinline))
|
|
|
|
show_stackframe(const wchar_t msg_level, int frame_count, int skip_levels) {
|
2013-01-12 07:09:33 +08:00
|
|
|
ASSERT_IS_NOT_FORKED_CHILD();
|
2016-10-21 09:53:31 +08:00
|
|
|
if (frame_count < 1) return;
|
2013-01-13 04:55:23 +08:00
|
|
|
|
2016-05-19 08:46:13 +08:00
|
|
|
// TODO: Decide if this is still needed. I'm commenting it out because it caused me some grief
|
|
|
|
// while trying to debug a test failure. And the tests run just fine without spurious failures
|
|
|
|
// if this check is not done.
|
|
|
|
//
|
2016-04-28 07:10:14 +08:00
|
|
|
// Hack to avoid showing backtraces in the tester.
|
2016-05-19 08:46:13 +08:00
|
|
|
// if (program_name && !wcscmp(program_name, L"(ignore)")) return;
|
2007-01-20 10:36:49 +08:00
|
|
|
|
2016-05-16 10:45:02 +08:00
|
|
|
debug_shared(msg_level, L"Backtrace:");
|
|
|
|
std::vector<wcstring> bt = demangled_backtrace(frame_count, skip_levels + 2);
|
2016-10-10 05:36:08 +08:00
|
|
|
for (int i = 0; (size_t)i < bt.size(); i++) {
|
2016-05-16 10:45:02 +08:00
|
|
|
debug_shared(msg_level, bt[i]);
|
|
|
|
}
|
2007-01-20 10:36:49 +08:00
|
|
|
}
|
|
|
|
|
2016-05-23 10:00:13 +08:00
|
|
|
#else // HAVE_BACKTRACE_SYMBOLS
|
2016-05-20 10:27:22 +08:00
|
|
|
|
2016-05-23 10:00:13 +08:00
|
|
|
void __attribute__((noinline))
|
|
|
|
show_stackframe(const wchar_t msg_level, int frame_count, int skip_levels) {
|
2016-05-20 10:27:22 +08:00
|
|
|
debug_shared(msg_level, L"Sorry, but your system does not support backtraces");
|
|
|
|
}
|
2016-05-23 10:00:13 +08:00
|
|
|
#endif // HAVE_BACKTRACE_SYMBOLS
|
2016-05-20 10:27:22 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
int fgetws2(wcstring *s, FILE *f) {
|
|
|
|
int i = 0;
|
2012-11-19 08:30:30 +08:00
|
|
|
wint_t c;
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
while (1) {
|
|
|
|
errno = 0;
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-03-11 10:17:39 +08:00
|
|
|
c = fgetwc(f);
|
2016-04-28 07:10:14 +08:00
|
|
|
if (errno == EILSEQ || errno == EINTR) {
|
2012-11-19 08:30:30 +08:00
|
|
|
continue;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
switch (c) {
|
|
|
|
// End of line.
|
2012-11-19 16:31:03 +08:00
|
|
|
case WEOF:
|
|
|
|
case L'\n':
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'\0': {
|
2012-11-19 16:31:03 +08:00
|
|
|
return i;
|
2016-04-28 07:10:14 +08:00
|
|
|
}
|
|
|
|
// Ignore carriage returns.
|
|
|
|
case L'\r': {
|
2012-11-19 16:31:03 +08:00
|
|
|
break;
|
2016-04-28 07:10:14 +08:00
|
|
|
}
|
|
|
|
default: {
|
2012-11-19 16:31:03 +08:00
|
|
|
i++;
|
|
|
|
s->push_back((wchar_t)c);
|
|
|
|
break;
|
2016-04-28 07:10:14 +08:00
|
|
|
}
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
/// Converts the narrow character string \c in into its wide equivalent, and return it.
|
|
|
|
///
|
|
|
|
/// The string may contain embedded nulls.
|
|
|
|
///
|
|
|
|
/// This function encodes illegal character sequences in a reversible way using the private use
|
|
|
|
/// area.
|
|
|
|
static wcstring str2wcs_internal(const char *in, const size_t in_len) {
|
|
|
|
if (in_len == 0) return wcstring();
|
2012-12-21 04:25:35 +08:00
|
|
|
assert(in != NULL);
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2012-12-21 04:25:35 +08:00
|
|
|
wcstring result;
|
|
|
|
result.reserve(in_len);
|
|
|
|
size_t in_pos = 0;
|
2016-03-11 10:17:39 +08:00
|
|
|
|
2016-05-23 10:00:13 +08:00
|
|
|
if (MB_CUR_MAX == 1) {
|
|
|
|
// Single-byte locale, all values are legal.
|
2016-04-28 07:10:14 +08:00
|
|
|
while (in_pos < in_len) {
|
2016-03-11 10:17:39 +08:00
|
|
|
result.push_back((unsigned char)in[in_pos]);
|
|
|
|
in_pos++;
|
|
|
|
}
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
|
|
|
mbstate_t state = {};
|
2016-04-28 07:10:14 +08:00
|
|
|
while (in_pos < in_len) {
|
2016-05-19 08:46:13 +08:00
|
|
|
bool use_encode_direct = false;
|
2016-07-30 18:08:57 +08:00
|
|
|
size_t ret = 0;
|
2012-12-21 04:25:35 +08:00
|
|
|
wchar_t wc = 0;
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-05-19 08:46:13 +08:00
|
|
|
if ((in[in_pos] & 0xF8) == 0xF8) {
|
|
|
|
// Protect against broken mbrtowc() implementations which attempt to encode UTF-8
|
|
|
|
// sequences longer than four bytes (e.g., OS X Snow Leopard).
|
2012-12-21 04:25:35 +08:00
|
|
|
use_encode_direct = true;
|
2016-05-23 10:00:13 +08:00
|
|
|
} else if (sizeof(wchar_t) == 2 && (in[in_pos] & 0xF8) == 0xF0) {
|
|
|
|
// Assume we are in a UTF-16 environment (e.g., Cygwin) using a UTF-8 encoding.
|
|
|
|
// The bits set check will be true for a four byte UTF-8 sequence that requires
|
|
|
|
// two UTF-16 chars. Something that doesn't work with our simple use of mbrtowc().
|
|
|
|
use_encode_direct = true;
|
2016-05-19 08:46:13 +08:00
|
|
|
} else {
|
|
|
|
ret = mbrtowc(&wc, &in[in_pos], in_len - in_pos, &state);
|
2016-05-23 10:00:13 +08:00
|
|
|
// fprintf(stderr, "WTF in_pos %d ret %d\n", in_pos, ret);
|
2016-05-19 08:46:13 +08:00
|
|
|
|
2016-05-23 10:00:13 +08:00
|
|
|
// Determine whether to encode this character with our crazy scheme.
|
2016-05-19 08:46:13 +08:00
|
|
|
if (wc >= ENCODE_DIRECT_BASE && wc < ENCODE_DIRECT_BASE + 256) {
|
|
|
|
use_encode_direct = true;
|
|
|
|
} else if (wc == INTERNAL_SEPARATOR) {
|
|
|
|
use_encode_direct = true;
|
|
|
|
} else if (ret == (size_t)-2) {
|
|
|
|
// Incomplete sequence.
|
|
|
|
use_encode_direct = true;
|
|
|
|
} else if (ret == (size_t)-1) {
|
|
|
|
// Invalid data.
|
|
|
|
use_encode_direct = true;
|
|
|
|
} else if (ret > in_len - in_pos) {
|
|
|
|
// Other error codes? Terrifying, should never happen.
|
|
|
|
use_encode_direct = true;
|
2016-05-23 10:00:13 +08:00
|
|
|
} else if (sizeof(wchar_t) == 2 && wc >= 0xD800 && wc <= 0xDFFF) {
|
|
|
|
// If we get a surrogate pair char on a UTF-16 system (e.g., Cygwin) then
|
|
|
|
// it's guaranteed the UTF-8 decoding is wrong so use direct encoding.
|
|
|
|
use_encode_direct = true;
|
2016-05-19 08:46:13 +08:00
|
|
|
}
|
2012-12-21 04:25:35 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
if (use_encode_direct) {
|
2016-05-23 10:00:13 +08:00
|
|
|
// fprintf(stderr, "WTF use_encode_direct\n");
|
2012-12-21 04:25:35 +08:00
|
|
|
wc = ENCODE_DIRECT_BASE + (unsigned char)in[in_pos];
|
|
|
|
result.push_back(wc);
|
2012-11-19 08:30:30 +08:00
|
|
|
in_pos++;
|
2014-12-08 14:17:44 +08:00
|
|
|
memset(&state, 0, sizeof state);
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (ret == 0) {
|
2016-05-23 10:00:13 +08:00
|
|
|
// fprintf(stderr, "WTF null byte\n");
|
2016-04-28 07:10:14 +08:00
|
|
|
// Embedded null byte!
|
2012-12-21 04:25:35 +08:00
|
|
|
result.push_back(L'\0');
|
|
|
|
in_pos++;
|
2014-12-08 14:17:44 +08:00
|
|
|
memset(&state, 0, sizeof state);
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2016-05-23 10:00:13 +08:00
|
|
|
// fprintf(stderr, "WTF null byte\n");
|
2016-04-28 07:10:14 +08:00
|
|
|
// Normal case.
|
2012-12-21 04:25:35 +08:00
|
|
|
result.push_back(wc);
|
|
|
|
in_pos += ret;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
|
|
|
}
|
2012-12-21 04:25:35 +08:00
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
wcstring str2wcstring(const char *in, size_t len) { return str2wcs_internal(in, len); }
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
wcstring str2wcstring(const char *in) { return str2wcs_internal(in, strlen(in)); }
|
2012-12-21 04:25:35 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
wcstring str2wcstring(const std::string &in) {
|
2016-05-19 08:46:13 +08:00
|
|
|
// Handles embedded nulls!
|
2012-12-21 04:25:35 +08:00
|
|
|
return str2wcs_internal(in.data(), in.size());
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
char *wcs2str(const wchar_t *in) {
|
|
|
|
if (!in) return NULL;
|
|
|
|
size_t desired_size = MAX_UTF8_BYTES * wcslen(in) + 1;
|
2012-03-09 15:21:07 +08:00
|
|
|
char local_buff[512];
|
2016-04-28 07:10:14 +08:00
|
|
|
if (desired_size <= sizeof local_buff / sizeof *local_buff) {
|
|
|
|
// Convert into local buff, then use strdup() so we don't waste malloc'd space.
|
2012-03-09 15:21:07 +08:00
|
|
|
char *result = wcs2str_internal(in, local_buff);
|
2016-04-28 07:10:14 +08:00
|
|
|
if (result) {
|
|
|
|
// It converted into the local buffer, so copy it.
|
2012-03-09 15:21:07 +08:00
|
|
|
result = strdup(result);
|
2016-05-05 06:19:47 +08:00
|
|
|
if (!result) DIE_MEM();
|
2012-03-09 15:21:07 +08:00
|
|
|
}
|
|
|
|
return result;
|
|
|
|
}
|
2016-05-05 06:19:47 +08:00
|
|
|
|
|
|
|
// Here we probably allocate a buffer probably much larger than necessary.
|
|
|
|
char *out = (char *)malloc(MAX_UTF8_BYTES * wcslen(in) + 1);
|
|
|
|
if (!out) DIE_MEM();
|
|
|
|
return wcs2str_internal(in, out);
|
2006-02-08 22:58:47 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
char *wcs2str(const wcstring &in) { return wcs2str(in.c_str()); }
|
2013-01-13 06:18:34 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
/// This function is distinguished from wcs2str_internal in that it allows embedded null bytes.
|
|
|
|
std::string wcs2string(const wcstring &input) {
|
2012-12-13 07:44:01 +08:00
|
|
|
std::string result;
|
|
|
|
result.reserve(input.size());
|
2012-12-20 05:31:06 +08:00
|
|
|
|
2016-03-11 10:17:39 +08:00
|
|
|
mbstate_t state = {};
|
2012-12-13 13:09:42 +08:00
|
|
|
char converted[MB_LEN_MAX + 1];
|
2012-12-20 05:31:06 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
for (size_t i = 0; i < input.size(); i++) {
|
2012-12-13 07:44:01 +08:00
|
|
|
wchar_t wc = input[i];
|
2016-04-28 07:10:14 +08:00
|
|
|
if (wc == INTERNAL_SEPARATOR) {
|
2016-03-11 10:17:39 +08:00
|
|
|
// Do nothing.
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (wc >= ENCODE_DIRECT_BASE && wc < ENCODE_DIRECT_BASE + 256) {
|
2012-12-13 07:44:01 +08:00
|
|
|
result.push_back(wc - ENCODE_DIRECT_BASE);
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (MB_CUR_MAX == 1) // single-byte locale (C/POSIX/ISO-8859)
|
2016-03-11 10:17:39 +08:00
|
|
|
{
|
|
|
|
// If `wc` contains a wide character we emit a question-mark.
|
2016-04-28 07:10:14 +08:00
|
|
|
if (wc & ~0xFF) {
|
2016-03-11 10:17:39 +08:00
|
|
|
wc = '?';
|
|
|
|
}
|
|
|
|
converted[0] = wc;
|
|
|
|
result.append(converted, 1);
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2014-12-08 14:17:44 +08:00
|
|
|
memset(converted, 0, sizeof converted);
|
2012-12-13 07:44:01 +08:00
|
|
|
size_t len = wcrtomb(converted, wc, &state);
|
2016-04-28 07:10:14 +08:00
|
|
|
if (len == (size_t)(-1)) {
|
2012-12-13 07:44:01 +08:00
|
|
|
debug(1, L"Wide character %d has no narrow representation", wc);
|
|
|
|
memset(&state, 0, sizeof(state));
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2012-12-13 07:44:01 +08:00
|
|
|
result.append(converted, len);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2012-12-20 05:31:06 +08:00
|
|
|
|
2011-12-27 11:18:46 +08:00
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
/// Converts the wide character string \c in into it's narrow equivalent, stored in \c out. \c out
|
|
|
|
/// must have enough space to fit the entire string.
|
|
|
|
///
|
|
|
|
/// This function decodes illegal character sequences in a reversible way using the private use
|
|
|
|
/// area.
|
|
|
|
static char *wcs2str_internal(const wchar_t *in, char *out) {
|
2012-11-19 08:30:30 +08:00
|
|
|
CHECK(in, 0);
|
|
|
|
CHECK(out, 0);
|
|
|
|
|
2016-03-11 10:17:39 +08:00
|
|
|
size_t in_pos = 0;
|
|
|
|
size_t out_pos = 0;
|
|
|
|
mbstate_t state = {};
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
while (in[in_pos]) {
|
|
|
|
if (in[in_pos] == INTERNAL_SEPARATOR) {
|
2016-03-11 10:17:39 +08:00
|
|
|
// Do nothing.
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (in[in_pos] >= ENCODE_DIRECT_BASE && in[in_pos] < ENCODE_DIRECT_BASE + 256) {
|
|
|
|
out[out_pos++] = in[in_pos] - ENCODE_DIRECT_BASE;
|
|
|
|
} else if (MB_CUR_MAX == 1) // single-byte locale (C/POSIX/ISO-8859)
|
2016-03-11 10:17:39 +08:00
|
|
|
{
|
|
|
|
// If `wc` contains a wide character we emit a question-mark.
|
2016-04-28 07:10:14 +08:00
|
|
|
if (in[in_pos] & ~0xFF) {
|
2016-03-11 10:17:39 +08:00
|
|
|
out[out_pos++] = '?';
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2016-03-11 10:17:39 +08:00
|
|
|
out[out_pos++] = (unsigned char)in[in_pos];
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2016-03-11 10:17:39 +08:00
|
|
|
size_t len = wcrtomb(&out[out_pos], in[in_pos], &state);
|
2016-04-28 07:10:14 +08:00
|
|
|
if (len == (size_t)-1) {
|
2012-11-19 08:30:30 +08:00
|
|
|
debug(1, L"Wide character %d has no narrow representation", in[in_pos]);
|
|
|
|
memset(&state, 0, sizeof(state));
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2016-03-11 10:17:39 +08:00
|
|
|
out_pos += len;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
in_pos++;
|
|
|
|
}
|
|
|
|
out[out_pos] = 0;
|
|
|
|
|
|
|
|
return out;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
wcstring format_string(const wchar_t *format, ...) {
|
2012-11-19 08:30:30 +08:00
|
|
|
va_list va;
|
|
|
|
va_start(va, format);
|
2012-02-10 10:43:36 +08:00
|
|
|
wcstring result = vformat_string(format, va);
|
2012-11-19 08:30:30 +08:00
|
|
|
va_end(va);
|
2012-02-10 10:43:36 +08:00
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void append_formatv(wcstring &target, const wchar_t *format, va_list va_orig) {
|
2012-03-04 11:12:06 +08:00
|
|
|
const int saved_err = errno;
|
2016-04-28 07:10:14 +08:00
|
|
|
// As far as I know, there is no way to check if a vswprintf-call failed because of a badly
|
|
|
|
// formated string option or because the supplied destination string was to small. In GLIBC,
|
|
|
|
// errno seems to be set to EINVAL either way.
|
|
|
|
//
|
|
|
|
// Because of this, on failiure we try to increase the buffer size until the free space is
|
|
|
|
// larger than max_size, at which point it will conclude that the error was probably due to a
|
|
|
|
// badly formated string option, and return an error. Make sure to null terminate string before
|
|
|
|
// that, though.
|
|
|
|
const size_t max_size = (128 * 1024 * 1024);
|
2012-03-04 11:12:06 +08:00
|
|
|
wchar_t static_buff[256];
|
|
|
|
size_t size = 0;
|
|
|
|
wchar_t *buff = NULL;
|
|
|
|
int status = -1;
|
2016-04-28 07:10:14 +08:00
|
|
|
while (status < 0) {
|
|
|
|
// Reallocate if necessary.
|
|
|
|
if (size == 0) {
|
2012-03-04 11:12:06 +08:00
|
|
|
buff = static_buff;
|
|
|
|
size = sizeof static_buff;
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2012-03-04 11:12:06 +08:00
|
|
|
size *= 2;
|
2016-04-28 07:10:14 +08:00
|
|
|
if (size >= max_size) {
|
2012-03-04 11:12:06 +08:00
|
|
|
buff[0] = '\0';
|
|
|
|
break;
|
|
|
|
}
|
2012-11-19 08:30:30 +08:00
|
|
|
buff = (wchar_t *)realloc((buff == static_buff ? NULL : buff), size);
|
2016-04-28 07:10:14 +08:00
|
|
|
if (buff == NULL) {
|
2012-03-04 11:12:06 +08:00
|
|
|
DIE_MEM();
|
|
|
|
}
|
|
|
|
}
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Try printing.
|
2012-11-19 08:30:30 +08:00
|
|
|
va_list va;
|
|
|
|
va_copy(va, va_orig);
|
2012-03-04 11:12:06 +08:00
|
|
|
status = vswprintf(buff, size / sizeof(wchar_t), format, va);
|
2012-11-19 08:30:30 +08:00
|
|
|
va_end(va);
|
2012-03-04 11:12:06 +08:00
|
|
|
}
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2014-05-01 07:29:52 +08:00
|
|
|
target.append(buff);
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
if (buff != static_buff) {
|
2012-03-04 11:12:06 +08:00
|
|
|
free(buff);
|
2014-05-01 07:29:52 +08:00
|
|
|
}
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2012-03-04 11:12:06 +08:00
|
|
|
errno = saved_err;
|
2011-12-27 11:18:46 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
wcstring vformat_string(const wchar_t *format, va_list va_orig) {
|
2014-05-01 07:29:52 +08:00
|
|
|
wcstring result;
|
|
|
|
append_formatv(result, format, va_orig);
|
|
|
|
return result;
|
2013-03-25 06:24:29 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void append_format(wcstring &str, const wchar_t *format, ...) {
|
2012-11-19 08:30:30 +08:00
|
|
|
va_list va;
|
|
|
|
va_start(va, format);
|
2013-03-25 06:24:29 +08:00
|
|
|
append_formatv(str, format, va);
|
2012-11-19 08:30:30 +08:00
|
|
|
va_end(va);
|
2012-02-23 02:51:06 +08:00
|
|
|
}
|
2012-02-10 10:43:36 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
wchar_t *quote_end(const wchar_t *pos) {
|
2012-11-19 08:30:30 +08:00
|
|
|
wchar_t c = *pos;
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
while (1) {
|
2012-11-19 08:30:30 +08:00
|
|
|
pos++;
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
if (!*pos) return 0;
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
if (*pos == L'\\') {
|
2012-11-19 08:30:30 +08:00
|
|
|
pos++;
|
2016-04-28 07:10:14 +08:00
|
|
|
if (!*pos) return 0;
|
|
|
|
} else {
|
|
|
|
if (*pos == c) {
|
2012-11-19 08:30:30 +08:00
|
|
|
return (wchar_t *)pos;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return 0;
|
|
|
|
}
|
|
|
|
|
2016-06-04 10:05:13 +08:00
|
|
|
void fish_setlocale() {
|
2016-04-28 07:10:14 +08:00
|
|
|
// Use ellipsis if on known unicode system, otherwise use $.
|
2016-06-15 08:16:18 +08:00
|
|
|
ellipsis_char = (fish_wcwidth(L'\x2026') > 0) ? L'\x2026' : L'$';
|
2012-12-03 18:25:08 +08:00
|
|
|
|
2012-12-02 07:44:09 +08:00
|
|
|
// U+23CE is the "return" character
|
2016-06-15 08:16:18 +08:00
|
|
|
omitted_newline_char = (fish_wcwidth(L'\x23CE') > 0) ? L'\x23CE' : L'~';
|
2005-09-20 21:26:39 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
bool contains_internal(const wchar_t *a, int vararg_handle, ...) {
|
2012-11-19 08:30:30 +08:00
|
|
|
const wchar_t *arg;
|
|
|
|
va_list va;
|
|
|
|
bool res = false;
|
|
|
|
|
|
|
|
CHECK(a, 0);
|
2006-05-03 00:28:30 +08:00
|
|
|
|
2014-03-10 09:43:40 +08:00
|
|
|
va_start(va, vararg_handle);
|
2016-04-28 07:10:14 +08:00
|
|
|
while ((arg = va_arg(va, const wchar_t *)) != 0) {
|
|
|
|
if (wcscmp(a, arg) == 0) {
|
2012-11-19 08:30:30 +08:00
|
|
|
res = true;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
va_end(va);
|
|
|
|
return res;
|
2012-01-31 01:46:33 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
/// wcstring variant of contains_internal. The first parameter is a wcstring, the rest are const
|
|
|
|
/// wchar_t *. vararg_handle exists only to give us a POD-value to pass to va_start.
|
|
|
|
__sentinel bool contains_internal(const wcstring &needle, int vararg_handle, ...) {
|
2012-11-19 08:30:30 +08:00
|
|
|
const wchar_t *arg;
|
|
|
|
va_list va;
|
|
|
|
int res = 0;
|
|
|
|
|
2014-03-10 09:43:40 +08:00
|
|
|
const wchar_t *needle_cstr = needle.c_str();
|
|
|
|
va_start(va, vararg_handle);
|
2016-04-28 07:10:14 +08:00
|
|
|
while ((arg = va_arg(va, const wchar_t *)) != 0) {
|
|
|
|
// libc++ has an unfortunate implementation of operator== that unconditonally wcslen's the
|
|
|
|
// wchar_t* parameter, so prefer wcscmp directly.
|
|
|
|
if (!wcscmp(needle_cstr, arg)) {
|
|
|
|
res = 1;
|
2012-11-19 08:30:30 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
va_end(va);
|
|
|
|
return res;
|
2005-09-20 21:26:39 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
long read_blocked(int fd, void *buf, size_t count) {
|
2012-11-19 08:30:30 +08:00
|
|
|
ssize_t res;
|
|
|
|
sigset_t chldset, oldset;
|
2005-09-20 21:26:39 +08:00
|
|
|
|
2012-11-19 08:30:30 +08:00
|
|
|
sigemptyset(&chldset);
|
|
|
|
sigaddset(&chldset, SIGCHLD);
|
|
|
|
VOMIT_ON_FAILURE(pthread_sigmask(SIG_BLOCK, &chldset, &oldset));
|
|
|
|
res = read(fd, buf, count);
|
|
|
|
VOMIT_ON_FAILURE(pthread_sigmask(SIG_SETMASK, &oldset, NULL));
|
|
|
|
return res;
|
2005-09-20 21:26:39 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
ssize_t write_loop(int fd, const char *buff, size_t count) {
|
|
|
|
size_t out_cum = 0;
|
|
|
|
while (out_cum < count) {
|
2013-01-05 14:32:40 +08:00
|
|
|
ssize_t out = write(fd, &buff[out_cum], count - out_cum);
|
2016-04-28 07:10:14 +08:00
|
|
|
if (out < 0) {
|
|
|
|
if (errno != EAGAIN && errno != EINTR) {
|
2012-11-19 08:30:30 +08:00
|
|
|
return -1;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2012-11-19 08:30:30 +08:00
|
|
|
out_cum += (size_t)out;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return (ssize_t)out_cum;
|
2009-02-23 04:28:52 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
ssize_t read_loop(int fd, void *buff, size_t count) {
|
2012-03-01 09:55:28 +08:00
|
|
|
ssize_t result;
|
2016-04-28 07:10:14 +08:00
|
|
|
do {
|
2012-03-01 09:55:28 +08:00
|
|
|
result = read(fd, buff, count);
|
2016-04-28 07:10:14 +08:00
|
|
|
} while (result < 0 && (errno == EAGAIN || errno == EINTR));
|
2012-03-01 09:55:28 +08:00
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
static bool should_debug(int level) {
|
|
|
|
if (level > debug_level) return false;
|
2005-09-20 21:26:39 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Hack to not print error messages in the tests.
|
|
|
|
if (program_name && !wcscmp(program_name, L"(ignore)")) return false;
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2012-07-18 03:47:01 +08:00
|
|
|
return true;
|
|
|
|
}
|
2006-05-31 23:40:28 +08:00
|
|
|
|
2016-05-16 10:45:02 +08:00
|
|
|
static void debug_shared(const wchar_t level, const wcstring &msg) {
|
|
|
|
pid_t current_pid = getpid();
|
|
|
|
|
|
|
|
if (current_pid == initial_pid) {
|
|
|
|
fwprintf(stderr, L"<%lc> %ls: %ls\n", (unsigned long)level, program_name, msg.c_str());
|
|
|
|
} else {
|
|
|
|
fwprintf(stderr, L"<%lc> %ls: %d: %ls\n", (unsigned long)level, program_name, current_pid,
|
|
|
|
msg.c_str());
|
|
|
|
}
|
2012-07-18 03:47:01 +08:00
|
|
|
}
|
2006-05-31 23:40:28 +08:00
|
|
|
|
2016-05-16 10:45:02 +08:00
|
|
|
static wchar_t level_char[] = {L'E', L'W', L'2', L'3', L'4', L'5'};
|
|
|
|
void __attribute__((noinline)) debug(int level, const wchar_t *msg, ...) {
|
2016-04-28 07:10:14 +08:00
|
|
|
if (!should_debug(level)) return;
|
2012-07-18 03:47:01 +08:00
|
|
|
int errno_old = errno;
|
|
|
|
va_list va;
|
2012-11-19 08:30:30 +08:00
|
|
|
va_start(va, msg);
|
2012-07-18 03:47:01 +08:00
|
|
|
wcstring local_msg = vformat_string(msg, va);
|
2012-11-19 08:30:30 +08:00
|
|
|
va_end(va);
|
2016-05-16 10:45:02 +08:00
|
|
|
const wchar_t msg_level = level <= 5 ? level_char[level] : L'9';
|
|
|
|
debug_shared(msg_level, local_msg);
|
|
|
|
if (debug_stack_frames > 0) {
|
|
|
|
show_stackframe(msg_level, debug_stack_frames, 1);
|
|
|
|
}
|
2012-07-18 03:47:01 +08:00
|
|
|
errno = errno_old;
|
|
|
|
}
|
|
|
|
|
2016-05-16 10:45:02 +08:00
|
|
|
void __attribute__((noinline)) debug(int level, const char *msg, ...) {
|
2016-04-28 07:10:14 +08:00
|
|
|
if (!should_debug(level)) return;
|
2012-07-18 03:47:01 +08:00
|
|
|
int errno_old = errno;
|
|
|
|
char local_msg[512];
|
|
|
|
va_list va;
|
2012-11-19 08:30:30 +08:00
|
|
|
va_start(va, msg);
|
2012-07-18 03:47:01 +08:00
|
|
|
vsnprintf(local_msg, sizeof local_msg, msg, va);
|
2012-11-19 08:30:30 +08:00
|
|
|
va_end(va);
|
2016-05-16 10:45:02 +08:00
|
|
|
const wchar_t msg_level = level <= 5 ? level_char[level] : L'9';
|
|
|
|
debug_shared(msg_level, str2wcstring(local_msg));
|
|
|
|
if (debug_stack_frames > 0) {
|
|
|
|
show_stackframe(msg_level, debug_stack_frames, 1);
|
|
|
|
}
|
2012-07-18 03:47:01 +08:00
|
|
|
errno = errno_old;
|
2012-02-23 02:51:06 +08:00
|
|
|
}
|
2006-01-15 19:58:05 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void read_ignore(int fd, void *buff, size_t count) {
|
2014-04-28 09:27:34 +08:00
|
|
|
size_t ignore __attribute__((unused));
|
|
|
|
ignore = read(fd, buff, count);
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void write_ignore(int fd, const void *buff, size_t count) {
|
2014-04-28 09:27:34 +08:00
|
|
|
size_t ignore __attribute__((unused));
|
|
|
|
ignore = write(fd, buff, count);
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void debug_safe(int level, const char *msg, const char *param1, const char *param2,
|
|
|
|
const char *param3, const char *param4, const char *param5, const char *param6,
|
|
|
|
const char *param7, const char *param8, const char *param9, const char *param10,
|
|
|
|
const char *param11, const char *param12) {
|
|
|
|
const char *const params[] = {param1, param2, param3, param4, param5, param6,
|
|
|
|
param7, param8, param9, param10, param11, param12};
|
|
|
|
if (!msg) return;
|
2012-07-18 03:47:01 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Can't call printf, that may allocate memory Just call write() over and over.
|
|
|
|
if (level > debug_level) return;
|
2012-03-01 03:27:14 +08:00
|
|
|
int errno_old = errno;
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2012-03-01 03:27:14 +08:00
|
|
|
size_t param_idx = 0;
|
|
|
|
const char *cursor = msg;
|
2016-04-28 07:10:14 +08:00
|
|
|
while (*cursor != '\0') {
|
2012-03-01 03:27:14 +08:00
|
|
|
const char *end = strchr(cursor, '%');
|
2016-04-28 07:10:14 +08:00
|
|
|
if (end == NULL) end = cursor + strlen(cursor);
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2014-04-28 09:27:34 +08:00
|
|
|
write_ignore(STDERR_FILENO, cursor, end - cursor);
|
2012-03-01 03:27:14 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
if (end[0] == '%' && end[1] == 's') {
|
|
|
|
// Handle a format string.
|
2012-03-09 15:21:07 +08:00
|
|
|
assert(param_idx < sizeof params / sizeof *params);
|
|
|
|
const char *format = params[param_idx++];
|
2016-04-28 07:10:14 +08:00
|
|
|
if (!format) format = "(null)";
|
2014-04-28 09:27:34 +08:00
|
|
|
write_ignore(STDERR_FILENO, format, strlen(format));
|
2012-03-01 03:27:14 +08:00
|
|
|
cursor = end + 2;
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (end[0] == '\0') {
|
|
|
|
// Must be at the end of the string.
|
2012-03-01 03:27:14 +08:00
|
|
|
cursor = end;
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
|
|
|
// Some other format specifier, just skip it.
|
2012-03-01 03:27:14 +08:00
|
|
|
cursor = end + 1;
|
|
|
|
}
|
|
|
|
}
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// We always append a newline.
|
2014-04-28 09:27:34 +08:00
|
|
|
write_ignore(STDERR_FILENO, "\n", 1);
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2012-03-01 03:27:14 +08:00
|
|
|
errno = errno_old;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void format_long_safe(char buff[64], long val) {
|
|
|
|
if (val == 0) {
|
2012-03-01 03:27:14 +08:00
|
|
|
strcpy(buff, "0");
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
|
|
|
// Generate the string in reverse.
|
2012-03-01 03:27:14 +08:00
|
|
|
size_t idx = 0;
|
|
|
|
bool negative = (val < 0);
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Note that we can't just negate val if it's negative, because it may be the most negative
|
|
|
|
// value. We do rely on round-towards-zero division though.
|
|
|
|
while (val != 0) {
|
2012-03-04 07:20:30 +08:00
|
|
|
long rem = val % 10;
|
|
|
|
buff[idx++] = '0' + (rem < 0 ? -rem : rem);
|
2012-03-01 03:27:14 +08:00
|
|
|
val /= 10;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
if (negative) buff[idx++] = '-';
|
2012-03-01 09:55:28 +08:00
|
|
|
buff[idx] = 0;
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2012-03-01 03:27:14 +08:00
|
|
|
size_t left = 0, right = idx - 1;
|
2016-04-28 07:10:14 +08:00
|
|
|
while (left < right) {
|
2012-03-01 03:27:14 +08:00
|
|
|
char tmp = buff[left];
|
|
|
|
buff[left++] = buff[right];
|
|
|
|
buff[right--] = tmp;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void format_long_safe(wchar_t buff[64], long val) {
|
|
|
|
if (val == 0) {
|
2012-03-04 07:20:30 +08:00
|
|
|
wcscpy(buff, L"0");
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
|
|
|
// Generate the string in reverse.
|
2012-03-04 07:20:30 +08:00
|
|
|
size_t idx = 0;
|
|
|
|
bool negative = (val < 0);
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
while (val != 0) {
|
2012-03-04 07:20:30 +08:00
|
|
|
long rem = val % 10;
|
2012-07-29 08:49:46 +08:00
|
|
|
buff[idx++] = L'0' + (wchar_t)(rem < 0 ? -rem : rem);
|
2012-03-04 07:20:30 +08:00
|
|
|
val /= 10;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
if (negative) buff[idx++] = L'-';
|
2012-03-04 07:20:30 +08:00
|
|
|
buff[idx] = 0;
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2012-03-04 07:20:30 +08:00
|
|
|
size_t left = 0, right = idx - 1;
|
2016-04-28 07:10:14 +08:00
|
|
|
while (left < right) {
|
2012-03-04 07:20:30 +08:00
|
|
|
wchar_t tmp = buff[left];
|
|
|
|
buff[left++] = buff[right];
|
|
|
|
buff[right--] = tmp;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void narrow_string_safe(char buff[64], const wchar_t *s) {
|
2016-02-28 17:38:28 +08:00
|
|
|
size_t idx = 0;
|
2016-04-28 07:10:14 +08:00
|
|
|
for (size_t widx = 0; s[widx] != L'\0'; widx++) {
|
2016-02-28 17:38:28 +08:00
|
|
|
wchar_t c = s[widx];
|
2016-04-28 07:10:14 +08:00
|
|
|
if (c <= 127) {
|
2016-02-28 17:38:28 +08:00
|
|
|
buff[idx++] = char(c);
|
2016-04-28 07:10:14 +08:00
|
|
|
if (idx + 1 == 64) {
|
2016-02-28 17:38:28 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
buff[idx] = '\0';
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
wcstring reformat_for_screen(const wcstring &msg) {
|
2015-09-22 02:24:49 +08:00
|
|
|
wcstring buff;
|
2012-11-19 08:30:30 +08:00
|
|
|
int line_width = 0;
|
|
|
|
int screen_width = common_get_width();
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
if (screen_width) {
|
2014-01-13 05:33:35 +08:00
|
|
|
const wchar_t *start = msg.c_str();
|
|
|
|
const wchar_t *pos = start;
|
2016-04-28 07:10:14 +08:00
|
|
|
while (1) {
|
2012-11-19 08:30:30 +08:00
|
|
|
int overflow = 0;
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
int tok_width = 0;
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Tokenize on whitespace, and also calculate the width of the token.
|
|
|
|
while (*pos && (!wcschr(L" \n\r\t", *pos))) {
|
|
|
|
// Check is token is wider than one line. If so we mark it as an overflow and break
|
|
|
|
// the token.
|
|
|
|
if ((tok_width + fish_wcwidth(*pos)) > (screen_width - 1)) {
|
2012-11-19 08:30:30 +08:00
|
|
|
overflow = 1;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
|
|
|
tok_width += fish_wcwidth(*pos);
|
|
|
|
pos++;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// If token is zero character long, we don't do anything.
|
|
|
|
if (pos == start) {
|
2016-06-15 10:21:50 +08:00
|
|
|
pos = pos + 1;
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (overflow) {
|
|
|
|
// In case of overflow, we print a newline, except if we already are at position 0.
|
|
|
|
wchar_t *token = wcsndup(start, pos - start);
|
|
|
|
if (line_width != 0) buff.push_back(L'\n');
|
2012-02-23 02:51:06 +08:00
|
|
|
buff.append(format_string(L"%ls-\n", token));
|
2012-11-19 08:30:30 +08:00
|
|
|
free(token);
|
2016-04-28 07:10:14 +08:00
|
|
|
line_width = 0;
|
|
|
|
} else {
|
|
|
|
// Print the token.
|
|
|
|
wchar_t *token = wcsndup(start, pos - start);
|
|
|
|
if ((line_width + (line_width != 0 ? 1 : 0) + tok_width) > screen_width) {
|
2012-02-23 02:51:06 +08:00
|
|
|
buff.push_back(L'\n');
|
2016-04-28 07:10:14 +08:00
|
|
|
line_width = 0;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
buff.append(format_string(L"%ls%ls", line_width ? L" " : L"", token));
|
2012-11-19 08:30:30 +08:00
|
|
|
free(token);
|
2016-04-28 07:10:14 +08:00
|
|
|
line_width += (line_width != 0 ? 1 : 0) + tok_width;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Break on end of string.
|
|
|
|
if (!*pos) {
|
2012-11-19 08:30:30 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
start = pos;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2012-02-23 02:51:06 +08:00
|
|
|
buff.append(msg);
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
2012-02-23 02:51:06 +08:00
|
|
|
buff.push_back(L'\n');
|
2015-09-22 02:24:49 +08:00
|
|
|
return buff;
|
2006-01-15 19:58:05 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
/// Escape a string, storing the result in out_str.
|
|
|
|
static void escape_string_internal(const wchar_t *orig_in, size_t in_len, wcstring *out_str,
|
|
|
|
escape_flags_t flags) {
|
2014-01-09 07:06:09 +08:00
|
|
|
assert(orig_in != NULL);
|
2005-10-14 19:40:33 +08:00
|
|
|
|
2014-01-09 07:06:09 +08:00
|
|
|
const wchar_t *in = orig_in;
|
2016-10-21 12:14:40 +08:00
|
|
|
bool escape_all = static_cast<bool>(flags & ESCAPE_ALL);
|
|
|
|
bool no_quoted = static_cast<bool>(flags & ESCAPE_NO_QUOTED);
|
|
|
|
bool no_tilde = static_cast<bool>(flags & ESCAPE_NO_TILDE);
|
2005-10-14 19:40:33 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
int need_escape = 0;
|
|
|
|
int need_complex_escape = 0;
|
2005-10-14 19:40:33 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Avoid dereferencing all over the place.
|
2014-01-09 07:06:09 +08:00
|
|
|
wcstring &out = *out_str;
|
2011-12-27 15:13:05 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
if (!no_quoted && in_len == 0) {
|
2014-01-09 07:06:09 +08:00
|
|
|
out.assign(L"''");
|
|
|
|
return;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
2012-05-09 17:33:42 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
while (*in != 0) {
|
|
|
|
if ((*in >= ENCODE_DIRECT_BASE) && (*in < ENCODE_DIRECT_BASE + 256)) {
|
2012-11-19 08:30:30 +08:00
|
|
|
int val = *in - ENCODE_DIRECT_BASE;
|
|
|
|
int tmp;
|
2012-05-14 11:49:14 +08:00
|
|
|
|
2014-01-09 07:06:09 +08:00
|
|
|
out += L'\\';
|
|
|
|
out += L'X';
|
2012-02-27 12:11:34 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
tmp = val / 16;
|
|
|
|
out += tmp > 9 ? L'a' + (tmp - 10) : L'0' + tmp;
|
2006-10-19 19:50:23 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
tmp = val % 16;
|
|
|
|
out += tmp > 9 ? L'a' + (tmp - 10) : L'0' + tmp;
|
|
|
|
need_escape = need_complex_escape = 1;
|
2006-11-17 22:58:25 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2012-11-19 08:30:30 +08:00
|
|
|
wchar_t c = *in;
|
2016-04-28 07:10:14 +08:00
|
|
|
switch (c) {
|
|
|
|
case L'\t': {
|
2014-01-09 07:06:09 +08:00
|
|
|
out += L'\\';
|
|
|
|
out += L't';
|
2016-04-28 07:10:14 +08:00
|
|
|
need_escape = need_complex_escape = 1;
|
2012-11-19 16:31:03 +08:00
|
|
|
break;
|
2016-04-28 07:10:14 +08:00
|
|
|
}
|
|
|
|
case L'\n': {
|
2014-01-09 07:06:09 +08:00
|
|
|
out += L'\\';
|
|
|
|
out += L'n';
|
2016-04-28 07:10:14 +08:00
|
|
|
need_escape = need_complex_escape = 1;
|
2012-11-19 16:31:03 +08:00
|
|
|
break;
|
2016-04-28 07:10:14 +08:00
|
|
|
}
|
|
|
|
case L'\b': {
|
2014-01-09 07:06:09 +08:00
|
|
|
out += L'\\';
|
|
|
|
out += L'b';
|
2016-04-28 07:10:14 +08:00
|
|
|
need_escape = need_complex_escape = 1;
|
2012-11-19 16:31:03 +08:00
|
|
|
break;
|
2016-04-28 07:10:14 +08:00
|
|
|
}
|
|
|
|
case L'\r': {
|
2014-01-09 07:06:09 +08:00
|
|
|
out += L'\\';
|
|
|
|
out += L'r';
|
2016-04-28 07:10:14 +08:00
|
|
|
need_escape = need_complex_escape = 1;
|
2012-11-19 16:31:03 +08:00
|
|
|
break;
|
2016-04-28 07:10:14 +08:00
|
|
|
}
|
|
|
|
case L'\x1b': {
|
2014-01-09 07:06:09 +08:00
|
|
|
out += L'\\';
|
|
|
|
out += L'e';
|
2016-04-28 07:10:14 +08:00
|
|
|
need_escape = need_complex_escape = 1;
|
2012-11-19 16:31:03 +08:00
|
|
|
break;
|
2016-04-28 07:10:14 +08:00
|
|
|
}
|
2012-11-19 16:31:03 +08:00
|
|
|
case L'\\':
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'\'': {
|
|
|
|
need_escape = need_complex_escape = 1;
|
|
|
|
if (escape_all) out += L'\\';
|
2014-01-09 07:06:09 +08:00
|
|
|
out += *in;
|
2012-11-19 16:31:03 +08:00
|
|
|
break;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case ANY_CHAR: {
|
|
|
|
// Experimental fix for #1614. The hope is that any time these appear in a
|
|
|
|
// string, they came from wildcard expansion.
|
2014-08-17 10:25:36 +08:00
|
|
|
out += L'?';
|
|
|
|
break;
|
2016-04-28 07:10:14 +08:00
|
|
|
}
|
|
|
|
case ANY_STRING: {
|
2014-08-17 10:25:36 +08:00
|
|
|
out += L'*';
|
|
|
|
break;
|
2016-04-28 07:10:14 +08:00
|
|
|
}
|
|
|
|
case ANY_STRING_RECURSIVE: {
|
2014-08-17 10:25:36 +08:00
|
|
|
out += L"**";
|
|
|
|
break;
|
2016-04-28 07:10:14 +08:00
|
|
|
}
|
2012-11-19 16:31:03 +08:00
|
|
|
case L'&':
|
|
|
|
case L'$':
|
|
|
|
case L' ':
|
|
|
|
case L'#':
|
|
|
|
case L'^':
|
|
|
|
case L'<':
|
|
|
|
case L'>':
|
|
|
|
case L'(':
|
|
|
|
case L')':
|
|
|
|
case L'[':
|
|
|
|
case L']':
|
|
|
|
case L'{':
|
|
|
|
case L'}':
|
|
|
|
case L'?':
|
|
|
|
case L'*':
|
|
|
|
case L'|':
|
|
|
|
case L';':
|
|
|
|
case L'"':
|
|
|
|
case L'%':
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'~': {
|
|
|
|
if (!no_tilde || c != L'~') {
|
|
|
|
need_escape = 1;
|
|
|
|
if (escape_all) out += L'\\';
|
2012-11-19 16:31:03 +08:00
|
|
|
}
|
2014-01-09 07:06:09 +08:00
|
|
|
out += *in;
|
2012-11-19 16:31:03 +08:00
|
|
|
break;
|
|
|
|
}
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
default: {
|
|
|
|
if (*in < 32) {
|
|
|
|
if (*in < 27 && *in > 0) {
|
2014-01-09 07:06:09 +08:00
|
|
|
out += L'\\';
|
|
|
|
out += L'c';
|
2016-04-28 07:10:14 +08:00
|
|
|
out += L'a' + *in - 1;
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
need_escape = need_complex_escape = 1;
|
2012-11-19 16:31:03 +08:00
|
|
|
break;
|
|
|
|
}
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
int tmp = (*in) % 16;
|
2014-01-09 07:06:09 +08:00
|
|
|
out += L'\\';
|
|
|
|
out += L'x';
|
2016-04-28 07:10:14 +08:00
|
|
|
out += ((*in > 15) ? L'1' : L'0');
|
|
|
|
out += tmp > 9 ? L'a' + (tmp - 10) : L'0' + tmp;
|
|
|
|
need_escape = need_complex_escape = 1;
|
|
|
|
} else {
|
2014-01-09 07:06:09 +08:00
|
|
|
out += *in;
|
2012-11-19 16:31:03 +08:00
|
|
|
}
|
|
|
|
break;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
in++;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Use quoted escaping if possible, since most people find it easier to read.
|
|
|
|
if (!no_quoted && need_escape && !need_complex_escape && escape_all) {
|
2014-01-09 07:06:09 +08:00
|
|
|
wchar_t single_quote = L'\'';
|
|
|
|
out.clear();
|
|
|
|
out.reserve(2 + in_len);
|
|
|
|
out.push_back(single_quote);
|
|
|
|
out.append(orig_in, in_len);
|
|
|
|
out.push_back(single_quote);
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
2014-01-09 07:06:09 +08:00
|
|
|
}
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
wcstring escape(const wchar_t *in, escape_flags_t flags) {
|
2014-09-26 09:20:03 +08:00
|
|
|
wcstring result;
|
|
|
|
escape_string_internal(in, wcslen(in), &result, flags);
|
|
|
|
return result;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
wcstring escape_string(const wcstring &in, escape_flags_t flags) {
|
2014-01-09 07:06:09 +08:00
|
|
|
wcstring result;
|
|
|
|
escape_string_internal(in.c_str(), in.size(), &result, flags);
|
2012-11-19 08:30:30 +08:00
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
/// Helper to return the last character in a string, or NOT_A_WCHAR.
|
|
|
|
static wint_t string_last_char(const wcstring &str) {
|
2013-11-25 14:57:49 +08:00
|
|
|
size_t len = str.size();
|
|
|
|
return len == 0 ? NOT_A_WCHAR : str.at(len - 1);
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
/// Given a null terminated string starting with a backslash, read the escape as if it is unquoted,
|
|
|
|
/// appending to result. Return the number of characters consumed, or 0 on error.
|
|
|
|
size_t read_unquoted_escape(const wchar_t *input, wcstring *result, bool allow_incomplete,
|
|
|
|
bool unescape_special) {
|
|
|
|
if (input[0] != L'\\') {
|
|
|
|
return 0; // not an escape
|
2013-11-25 14:57:49 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Here's the character we'll ultimately append, or NOT_A_WCHAR for none. Note that L'\0' is a
|
|
|
|
// valid thing to append.
|
2014-05-14 13:30:41 +08:00
|
|
|
wint_t result_char_or_none = NOT_A_WCHAR;
|
2013-11-25 14:57:49 +08:00
|
|
|
|
|
|
|
bool errored = false;
|
2016-04-28 07:10:14 +08:00
|
|
|
size_t in_pos = 1; // in_pos always tracks the next character to read (and therefore the number
|
|
|
|
// of characters read so far)
|
2013-11-25 14:57:49 +08:00
|
|
|
const wchar_t c = input[in_pos++];
|
2016-04-28 07:10:14 +08:00
|
|
|
switch (c) {
|
|
|
|
// A null character after a backslash is an error.
|
|
|
|
case L'\0': {
|
|
|
|
// Adjust in_pos to only include the backslash.
|
2013-11-25 14:57:49 +08:00
|
|
|
assert(in_pos > 0);
|
|
|
|
in_pos--;
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// It's an error, unless we're allowing incomplete escapes.
|
|
|
|
if (!allow_incomplete) errored = true;
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
// Numeric escape sequences. No prefix means octal escape, otherwise hexadecimal.
|
2013-11-25 14:57:49 +08:00
|
|
|
case L'0':
|
|
|
|
case L'1':
|
|
|
|
case L'2':
|
|
|
|
case L'3':
|
|
|
|
case L'4':
|
|
|
|
case L'5':
|
|
|
|
case L'6':
|
|
|
|
case L'7':
|
|
|
|
case L'u':
|
|
|
|
case L'U':
|
|
|
|
case L'x':
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'X': {
|
|
|
|
long long res = 0;
|
|
|
|
size_t chars = 2;
|
|
|
|
int base = 16;
|
2013-11-25 14:57:49 +08:00
|
|
|
bool byte_literal = false;
|
|
|
|
wchar_t max_val = ASCII_MAX;
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
switch (c) {
|
|
|
|
case L'u': {
|
|
|
|
chars = 4;
|
2013-11-25 14:57:49 +08:00
|
|
|
max_val = UCS2_MAX;
|
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'U': {
|
|
|
|
chars = 8;
|
2013-11-25 14:57:49 +08:00
|
|
|
max_val = WCHAR_MAX;
|
2014-01-15 17:40:40 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Don't exceed the largest Unicode code point - see #1107.
|
|
|
|
if (0x10FFFF < max_val) max_val = (wchar_t)0x10FFFF;
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'x': {
|
2013-11-25 14:57:49 +08:00
|
|
|
chars = 2;
|
|
|
|
max_val = ASCII_MAX;
|
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'X': {
|
2013-11-25 14:57:49 +08:00
|
|
|
byte_literal = true;
|
|
|
|
max_val = BYTE_MAX;
|
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
default: {
|
|
|
|
base = 8;
|
|
|
|
chars = 3;
|
|
|
|
// Note that in_pos currently is just after the first post-backslash character;
|
|
|
|
// we want to start our escape from there.
|
2013-11-25 14:57:49 +08:00
|
|
|
assert(in_pos > 0);
|
|
|
|
in_pos--;
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
for (size_t i = 0; i < chars; i++) {
|
|
|
|
long d = convert_digit(input[in_pos], base);
|
|
|
|
if (d < 0) {
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
res = (res * base) + d;
|
2013-11-25 14:57:49 +08:00
|
|
|
in_pos++;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
if (res <= max_val) {
|
|
|
|
result_char_or_none = (wchar_t)((byte_literal ? ENCODE_DIRECT_BASE : 0) + res);
|
|
|
|
} else {
|
2013-11-25 14:57:49 +08:00
|
|
|
errored = true;
|
|
|
|
}
|
|
|
|
|
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
// \a means bell (alert).
|
|
|
|
case L'a': {
|
2014-05-14 13:30:41 +08:00
|
|
|
result_char_or_none = L'\a';
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
// \b means backspace.
|
|
|
|
case L'b': {
|
2014-05-14 13:30:41 +08:00
|
|
|
result_char_or_none = L'\b';
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
// \cX means control sequence X.
|
|
|
|
case L'c': {
|
2013-11-25 14:57:49 +08:00
|
|
|
const wchar_t sequence_char = input[in_pos++];
|
2016-04-28 07:10:14 +08:00
|
|
|
if (sequence_char >= L'a' && sequence_char <= (L'a' + 32)) {
|
|
|
|
result_char_or_none = sequence_char - L'a' + 1;
|
|
|
|
} else if (sequence_char >= L'A' && sequence_char <= (L'A' + 32)) {
|
|
|
|
result_char_or_none = sequence_char - L'A' + 1;
|
|
|
|
} else {
|
2013-11-25 14:57:49 +08:00
|
|
|
errored = true;
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
// \x1b means escape.
|
|
|
|
case L'e': {
|
2014-05-14 13:30:41 +08:00
|
|
|
result_char_or_none = L'\x1b';
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
// \f means form feed.
|
|
|
|
case L'f': {
|
2014-05-14 13:30:41 +08:00
|
|
|
result_char_or_none = L'\f';
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
// \n means newline.
|
|
|
|
case L'n': {
|
2014-05-14 13:30:41 +08:00
|
|
|
result_char_or_none = L'\n';
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
// \r means carriage return.
|
|
|
|
case L'r': {
|
2014-05-14 13:30:41 +08:00
|
|
|
result_char_or_none = L'\r';
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
// \t means tab.
|
|
|
|
case L't': {
|
2014-05-14 13:30:41 +08:00
|
|
|
result_char_or_none = L'\t';
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
// \v means vertical tab.
|
|
|
|
case L'v': {
|
2014-05-14 13:30:41 +08:00
|
|
|
result_char_or_none = L'\v';
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
// If a backslash is followed by an actual newline, swallow them both.
|
|
|
|
case L'\n': {
|
2014-05-14 13:30:41 +08:00
|
|
|
result_char_or_none = NOT_A_WCHAR;
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
default: {
|
|
|
|
if (unescape_special) result->push_back(INTERNAL_SEPARATOR);
|
2014-05-14 13:30:41 +08:00
|
|
|
result_char_or_none = c;
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
if (!errored && result_char_or_none != NOT_A_WCHAR) {
|
2014-05-14 13:30:41 +08:00
|
|
|
wchar_t result_char = static_cast<wchar_t>(result_char_or_none);
|
2016-04-28 07:10:14 +08:00
|
|
|
// If result_char is not NOT_A_WCHAR, it must be a valid wchar.
|
2014-05-14 13:30:41 +08:00
|
|
|
assert((wint_t)result_char == result_char_or_none);
|
2013-11-25 14:57:49 +08:00
|
|
|
result->push_back(result_char);
|
|
|
|
}
|
|
|
|
return errored ? 0 : in_pos;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
/// Returns the unescaped version of input_str into output_str (by reference). Returns true if
|
|
|
|
/// successful. If false, the contents of output_str are undefined (!).
|
|
|
|
static bool unescape_string_internal(const wchar_t *const input, const size_t input_len,
|
|
|
|
wcstring *output_str, unescape_flags_t flags) {
|
|
|
|
// Set up result string, which we'll swap with the output on success.
|
2013-11-25 14:57:49 +08:00
|
|
|
wcstring result;
|
|
|
|
result.reserve(input_len);
|
|
|
|
|
2016-10-21 12:14:40 +08:00
|
|
|
const bool unescape_special = static_cast<bool>(flags & UNESCAPE_SPECIAL);
|
|
|
|
const bool allow_incomplete = static_cast<bool>(flags & UNESCAPE_INCOMPLETE);
|
2013-11-25 14:57:49 +08:00
|
|
|
|
|
|
|
int bracket_count = 0;
|
|
|
|
|
|
|
|
bool errored = false;
|
2016-04-28 07:10:14 +08:00
|
|
|
enum { mode_unquoted, mode_single_quotes, mode_double_quotes } mode = mode_unquoted;
|
2013-11-25 14:57:49 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
for (size_t input_position = 0; input_position < input_len && !errored; input_position++) {
|
2013-11-25 14:57:49 +08:00
|
|
|
const wchar_t c = input[input_position];
|
2016-04-28 07:10:14 +08:00
|
|
|
// Here's the character we'll append to result, or NOT_A_WCHAR to suppress it.
|
2014-05-14 13:30:41 +08:00
|
|
|
wint_t to_append_or_none = c;
|
2016-04-28 07:10:14 +08:00
|
|
|
if (mode == mode_unquoted) {
|
|
|
|
switch (c) {
|
|
|
|
case L'\\': {
|
|
|
|
// Backslashes (escapes) are complicated and may result in errors, or appending
|
|
|
|
// INTERNAL_SEPARATORs, so we have to handle them specially.
|
|
|
|
size_t escape_chars = read_unquoted_escape(input + input_position, &result,
|
|
|
|
allow_incomplete, unescape_special);
|
|
|
|
if (escape_chars == 0) {
|
|
|
|
// A 0 return indicates an error.
|
2013-11-25 14:57:49 +08:00
|
|
|
errored = true;
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
|
|
|
// Skip over the characters we read, minus one because the outer loop will
|
|
|
|
// increment it.
|
2013-11-25 14:57:49 +08:00
|
|
|
assert(escape_chars > 0);
|
|
|
|
input_position += escape_chars - 1;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
// We've already appended, don't append anything else.
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = NOT_A_WCHAR;
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'~': {
|
|
|
|
if (unescape_special && (input_position == 0)) {
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = HOME_DIRECTORY;
|
2013-11-25 14:57:49 +08:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'%': {
|
|
|
|
if (unescape_special && (input_position == 0)) {
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = PROCESS_EXPAND;
|
2013-11-25 14:57:49 +08:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'*': {
|
|
|
|
if (unescape_special) {
|
|
|
|
// In general, this is ANY_STRING. But as a hack, if the last appended char
|
|
|
|
// is ANY_STRING, delete the last char and store ANY_STRING_RECURSIVE to
|
|
|
|
// reflect the fact that ** is the recursive wildcard.
|
|
|
|
if (string_last_char(result) == ANY_STRING) {
|
2013-11-25 14:57:49 +08:00
|
|
|
assert(result.size() > 0);
|
|
|
|
result.resize(result.size() - 1);
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = ANY_STRING_RECURSIVE;
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = ANY_STRING;
|
2013-11-25 14:57:49 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'?': {
|
|
|
|
if (unescape_special) {
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = ANY_CHAR;
|
2013-11-25 14:57:49 +08:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'$': {
|
|
|
|
if (unescape_special) {
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = VARIABLE_EXPAND;
|
2013-11-25 14:57:49 +08:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'{': {
|
|
|
|
if (unescape_special) {
|
2013-11-25 14:57:49 +08:00
|
|
|
bracket_count++;
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = BRACKET_BEGIN;
|
2013-11-25 14:57:49 +08:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'}': {
|
|
|
|
if (unescape_special) {
|
2013-11-25 14:57:49 +08:00
|
|
|
bracket_count--;
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = BRACKET_END;
|
2013-11-25 14:57:49 +08:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case L',': {
|
|
|
|
// If the last character was a separator, then treat this as a literal comma.
|
|
|
|
if (unescape_special && bracket_count > 0 &&
|
|
|
|
string_last_char(result) != BRACKET_SEP) {
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = BRACKET_SEP;
|
2013-11-25 14:57:49 +08:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'\'': {
|
2013-11-25 14:57:49 +08:00
|
|
|
mode = mode_single_quotes;
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = unescape_special ? INTERNAL_SEPARATOR : NOT_A_WCHAR;
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'\"': {
|
2013-11-25 14:57:49 +08:00
|
|
|
mode = mode_double_quotes;
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = unescape_special ? INTERNAL_SEPARATOR : NOT_A_WCHAR;
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (mode == mode_single_quotes) {
|
|
|
|
if (c == L'\\') {
|
|
|
|
// A backslash may or may not escape something in single quotes.
|
|
|
|
switch (input[input_position + 1]) {
|
2013-11-25 14:57:49 +08:00
|
|
|
case '\\':
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'\'': {
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = input[input_position + 1];
|
2016-04-28 07:10:14 +08:00
|
|
|
input_position += 1; // skip over the backslash
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case L'\0': {
|
|
|
|
if (!allow_incomplete) {
|
2013-11-25 14:57:49 +08:00
|
|
|
errored = true;
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
|
|
|
// PCA this line had the following cryptic comment: 'We may ever escape
|
|
|
|
// a NULL character, but still appending a \ in case I am wrong.' Not
|
|
|
|
// sure what it means or the importance of this.
|
2013-11-25 14:57:49 +08:00
|
|
|
input_position += 1; /* Skip over the backslash */
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = L'\\';
|
2013-11-25 14:57:49 +08:00
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
break;
|
2013-11-25 14:57:49 +08:00
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
default: {
|
|
|
|
// Literal backslash that doesn't escape anything! Leave things alone; we'll
|
|
|
|
// append the backslash itself.
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (c == L'\'') {
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = unescape_special ? INTERNAL_SEPARATOR : NOT_A_WCHAR;
|
2013-11-25 14:57:49 +08:00
|
|
|
mode = mode_unquoted;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (mode == mode_double_quotes) {
|
|
|
|
switch (c) {
|
|
|
|
case L'"': {
|
2013-11-25 14:57:49 +08:00
|
|
|
mode = mode_unquoted;
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = unescape_special ? INTERNAL_SEPARATOR : NOT_A_WCHAR;
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case '\\': {
|
|
|
|
switch (input[input_position + 1]) {
|
|
|
|
case L'\0': {
|
|
|
|
if (!allow_incomplete) {
|
2013-11-25 14:57:49 +08:00
|
|
|
errored = true;
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = L'\0';
|
2013-11-25 14:57:49 +08:00
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
break;
|
2013-11-25 14:57:49 +08:00
|
|
|
}
|
|
|
|
case '\\':
|
|
|
|
case L'$':
|
2016-04-28 07:10:14 +08:00
|
|
|
case '"': {
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = input[input_position + 1];
|
2013-11-25 14:57:49 +08:00
|
|
|
input_position += 1; /* Skip over the backslash */
|
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case '\n': {
|
2013-11-25 14:57:49 +08:00
|
|
|
/* Swallow newline */
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = NOT_A_WCHAR;
|
2013-11-26 17:39:16 +08:00
|
|
|
input_position += 1; /* Skip over the backslash */
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
default: {
|
|
|
|
/* Literal backslash that doesn't escape anything! Leave things alone;
|
|
|
|
* we'll append the backslash itself */
|
2013-11-25 14:57:49 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
case '$': {
|
|
|
|
if (unescape_special) {
|
2014-05-14 13:30:41 +08:00
|
|
|
to_append_or_none = VARIABLE_EXPAND_SINGLE;
|
2013-11-25 14:57:49 +08:00
|
|
|
}
|
|
|
|
break;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Now maybe append the char.
|
|
|
|
if (to_append_or_none != NOT_A_WCHAR) {
|
2014-05-14 13:30:41 +08:00
|
|
|
wchar_t to_append_char = static_cast<wchar_t>(to_append_or_none);
|
2016-04-28 07:10:14 +08:00
|
|
|
// If result_char is not NOT_A_WCHAR, it must be a valid wchar.
|
2014-05-14 13:30:41 +08:00
|
|
|
assert((wint_t)to_append_char == to_append_or_none);
|
|
|
|
result.push_back(to_append_char);
|
2013-11-25 14:57:49 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Return the string by reference, and then success.
|
|
|
|
if (!errored) {
|
2013-11-25 14:57:49 +08:00
|
|
|
output_str->swap(result);
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
return !errored;
|
2013-11-25 14:57:49 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
bool unescape_string_in_place(wcstring *str, unescape_flags_t escape_special) {
|
2013-11-25 14:57:49 +08:00
|
|
|
assert(str != NULL);
|
|
|
|
wcstring output;
|
|
|
|
bool success = unescape_string_internal(str->c_str(), str->size(), &output, escape_special);
|
2016-04-28 07:10:14 +08:00
|
|
|
if (success) {
|
2013-11-25 14:57:49 +08:00
|
|
|
str->swap(output);
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
|
|
|
return success;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
bool unescape_string(const wchar_t *input, wcstring *output, unescape_flags_t escape_special) {
|
2013-11-25 14:57:49 +08:00
|
|
|
bool success = unescape_string_internal(input, wcslen(input), output, escape_special);
|
2016-04-28 07:10:14 +08:00
|
|
|
if (!success) output->clear();
|
2013-11-25 14:57:49 +08:00
|
|
|
return success;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
bool unescape_string(const wcstring &input, wcstring *output, unescape_flags_t escape_special) {
|
2013-11-25 14:57:49 +08:00
|
|
|
bool success = unescape_string_internal(input.c_str(), input.size(), output, escape_special);
|
2016-04-28 07:10:14 +08:00
|
|
|
if (!success) output->clear();
|
2013-11-25 14:57:49 +08:00
|
|
|
return success;
|
|
|
|
}
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void common_handle_winch(int signal) {
|
|
|
|
// Don't run ioctl() here, it's not safe to use in signals.
|
2016-10-10 05:38:26 +08:00
|
|
|
UNUSED(signal);
|
2014-08-24 15:59:03 +08:00
|
|
|
termsize_valid = false;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
/// Updates termsize as needed, and returns a copy of the winsize.
|
|
|
|
static struct winsize get_current_winsize() {
|
2014-08-24 15:59:03 +08:00
|
|
|
#ifndef HAVE_WINSIZE
|
|
|
|
struct winsize retval = {0};
|
|
|
|
retval.ws_col = 80;
|
|
|
|
retval.ws_row = 24;
|
|
|
|
return retval;
|
|
|
|
#endif
|
|
|
|
scoped_rwlock guard(termsize_rwlock, true);
|
|
|
|
struct winsize retval = termsize;
|
2016-04-28 07:10:14 +08:00
|
|
|
if (!termsize_valid) {
|
2014-08-24 15:59:03 +08:00
|
|
|
struct winsize size;
|
2016-04-28 07:10:14 +08:00
|
|
|
if (ioctl(1, TIOCGWINSZ, &size) == 0) {
|
2014-08-24 15:59:03 +08:00
|
|
|
retval = size;
|
|
|
|
guard.upgrade();
|
|
|
|
termsize = retval;
|
|
|
|
}
|
|
|
|
termsize_valid = true;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
2014-08-24 15:59:03 +08:00
|
|
|
return retval;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
int common_get_width() { return get_current_winsize().ws_col; }
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
int common_get_height() { return get_current_winsize().ws_row; }
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void tokenize_variable_array(const wcstring &val, std::vector<wcstring> &out) {
|
2012-11-19 08:30:30 +08:00
|
|
|
size_t pos = 0, end = val.size();
|
2016-04-28 07:10:14 +08:00
|
|
|
while (pos <= end) {
|
2012-11-19 08:30:30 +08:00
|
|
|
size_t next_pos = val.find(ARRAY_SEP, pos);
|
2016-04-28 07:10:14 +08:00
|
|
|
if (next_pos == wcstring::npos) {
|
2014-02-25 01:54:30 +08:00
|
|
|
next_pos = end;
|
|
|
|
}
|
|
|
|
out.resize(out.size() + 1);
|
|
|
|
out.back().assign(val, pos, next_pos - pos);
|
2016-04-28 07:10:14 +08:00
|
|
|
pos = next_pos + 1; // skip the separator, or skip past the end
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
bool string_prefixes_string(const wchar_t *proposed_prefix, const wcstring &value) {
|
2012-11-19 08:30:30 +08:00
|
|
|
size_t prefix_size = wcslen(proposed_prefix);
|
|
|
|
return prefix_size <= value.size() && value.compare(0, prefix_size, proposed_prefix) == 0;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
bool string_prefixes_string(const wcstring &proposed_prefix, const wcstring &value) {
|
2012-11-19 08:30:30 +08:00
|
|
|
size_t prefix_size = proposed_prefix.size();
|
|
|
|
return prefix_size <= value.size() && value.compare(0, prefix_size, proposed_prefix) == 0;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
bool string_prefixes_string_case_insensitive(const wcstring &proposed_prefix,
|
|
|
|
const wcstring &value) {
|
2012-11-19 08:30:30 +08:00
|
|
|
size_t prefix_size = proposed_prefix.size();
|
2016-04-28 07:10:14 +08:00
|
|
|
return prefix_size <= value.size() &&
|
|
|
|
wcsncasecmp(proposed_prefix.c_str(), value.c_str(), prefix_size) == 0;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
bool string_suffixes_string(const wcstring &proposed_suffix, const wcstring &value) {
|
2012-11-19 08:30:30 +08:00
|
|
|
size_t suffix_size = proposed_suffix.size();
|
2016-04-28 07:10:14 +08:00
|
|
|
return suffix_size <= value.size() &&
|
|
|
|
value.compare(value.size() - suffix_size, suffix_size, proposed_suffix) == 0;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
bool string_suffixes_string(const wchar_t *proposed_suffix, const wcstring &value) {
|
2012-11-19 08:30:30 +08:00
|
|
|
size_t suffix_size = wcslen(proposed_suffix);
|
2016-04-28 07:10:14 +08:00
|
|
|
return suffix_size <= value.size() &&
|
|
|
|
value.compare(value.size() - suffix_size, suffix_size, proposed_suffix) == 0;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
/// Returns true if seq, represented as a subsequence, is contained within string.
|
|
|
|
static bool subsequence_in_string(const wcstring &seq, const wcstring &str) {
|
|
|
|
// Impossible if seq is larger than string.
|
|
|
|
if (seq.size() > str.size()) {
|
2013-05-26 06:41:18 +08:00
|
|
|
return false;
|
|
|
|
}
|
2013-06-02 16:14:26 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Empty strings are considered to be subsequences of everything.
|
|
|
|
if (seq.empty()) {
|
2013-05-26 06:41:18 +08:00
|
|
|
return true;
|
|
|
|
}
|
2013-06-02 16:14:26 +08:00
|
|
|
|
2013-05-26 06:41:18 +08:00
|
|
|
size_t str_idx, seq_idx;
|
2016-04-28 07:10:14 +08:00
|
|
|
for (seq_idx = str_idx = 0; seq_idx < seq.size() && str_idx < str.size(); seq_idx++) {
|
2013-05-26 06:41:18 +08:00
|
|
|
wchar_t c = seq.at(seq_idx);
|
|
|
|
size_t char_loc = str.find(c, str_idx);
|
2016-04-28 07:10:14 +08:00
|
|
|
if (char_loc == wcstring::npos) {
|
|
|
|
break; // didn't find this character
|
|
|
|
} else {
|
|
|
|
str_idx = char_loc + 1; // we found it, continue the search just after it
|
2013-05-26 06:41:18 +08:00
|
|
|
}
|
|
|
|
}
|
2013-06-02 16:14:26 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// We succeeded if we exhausted our sequence.
|
2013-05-26 06:41:18 +08:00
|
|
|
assert(seq_idx <= seq.size());
|
|
|
|
return seq_idx == seq.size();
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
string_fuzzy_match_t::string_fuzzy_match_t(enum fuzzy_match_type_t t, size_t distance_first,
|
|
|
|
size_t distance_second)
|
|
|
|
: type(t), match_distance_first(distance_first), match_distance_second(distance_second) {}
|
2013-05-26 06:41:18 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
string_fuzzy_match_t string_fuzzy_match_string(const wcstring &string,
|
|
|
|
const wcstring &match_against,
|
|
|
|
fuzzy_match_type_t limit_type) {
|
|
|
|
// Distances are generally the amount of text not matched.
|
2013-05-26 06:41:18 +08:00
|
|
|
string_fuzzy_match_t result(fuzzy_match_none, 0, 0);
|
|
|
|
size_t location;
|
2016-04-28 07:10:14 +08:00
|
|
|
if (limit_type >= fuzzy_match_exact && string == match_against) {
|
2013-05-26 06:41:18 +08:00
|
|
|
result.type = fuzzy_match_exact;
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (limit_type >= fuzzy_match_prefix && string_prefixes_string(string, match_against)) {
|
2013-05-26 06:41:18 +08:00
|
|
|
result.type = fuzzy_match_prefix;
|
|
|
|
assert(match_against.size() >= string.size());
|
|
|
|
result.match_distance_first = match_against.size() - string.size();
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (limit_type >= fuzzy_match_case_insensitive &&
|
|
|
|
wcscasecmp(string.c_str(), match_against.c_str()) == 0) {
|
2013-05-26 06:41:18 +08:00
|
|
|
result.type = fuzzy_match_case_insensitive;
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (limit_type >= fuzzy_match_prefix_case_insensitive &&
|
|
|
|
string_prefixes_string_case_insensitive(string, match_against)) {
|
2013-05-26 06:41:18 +08:00
|
|
|
result.type = fuzzy_match_prefix_case_insensitive;
|
|
|
|
assert(match_against.size() >= string.size());
|
|
|
|
result.match_distance_first = match_against.size() - string.size();
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (limit_type >= fuzzy_match_substring &&
|
|
|
|
(location = match_against.find(string)) != wcstring::npos) {
|
|
|
|
// String is contained within match against.
|
2013-05-26 06:41:18 +08:00
|
|
|
result.type = fuzzy_match_substring;
|
|
|
|
assert(match_against.size() >= string.size());
|
|
|
|
result.match_distance_first = match_against.size() - string.size();
|
2016-04-28 07:10:14 +08:00
|
|
|
result.match_distance_second = location; // prefer earlier matches
|
|
|
|
} else if (limit_type >= fuzzy_match_subsequence_insertions_only &&
|
|
|
|
subsequence_in_string(string, match_against)) {
|
2013-05-26 06:41:18 +08:00
|
|
|
result.type = fuzzy_match_subsequence_insertions_only;
|
|
|
|
assert(match_against.size() >= string.size());
|
|
|
|
result.match_distance_first = match_against.size() - string.size();
|
2016-04-28 07:10:14 +08:00
|
|
|
// It would be nice to prefer matches with greater matching runs here.
|
2013-05-26 06:41:18 +08:00
|
|
|
}
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
template <typename T>
|
|
|
|
static inline int compare_ints(T a, T b) {
|
2013-05-26 06:41:18 +08:00
|
|
|
if (a < b) return -1;
|
|
|
|
if (a == b) return 0;
|
|
|
|
return 1;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
/// Compare types; if the types match, compare distances.
|
|
|
|
int string_fuzzy_match_t::compare(const string_fuzzy_match_t &rhs) const {
|
|
|
|
if (this->type != rhs.type) {
|
2013-05-26 06:41:18 +08:00
|
|
|
return compare_ints(this->type, rhs.type);
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (this->match_distance_first != rhs.match_distance_first) {
|
2013-05-26 06:41:18 +08:00
|
|
|
return compare_ints(this->match_distance_first, rhs.match_distance_first);
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (this->match_distance_second != rhs.match_distance_second) {
|
2013-05-26 06:41:18 +08:00
|
|
|
return compare_ints(this->match_distance_second, rhs.match_distance_second);
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
return 0; // equal
|
2013-05-26 06:41:18 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
bool list_contains_string(const wcstring_list_t &list, const wcstring &str) {
|
2012-11-19 08:30:30 +08:00
|
|
|
return std::find(list.begin(), list.end(), str) != list.end();
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
int create_directory(const wcstring &d) {
|
2012-11-19 08:30:30 +08:00
|
|
|
int ok = 0;
|
|
|
|
struct stat buf;
|
|
|
|
int stat_res = 0;
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
while ((stat_res = wstat(d, &buf)) != 0) {
|
|
|
|
if (errno != EAGAIN) break;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
if (stat_res == 0) {
|
|
|
|
if (S_ISDIR(buf.st_mode)) {
|
2012-11-19 08:30:30 +08:00
|
|
|
ok = 1;
|
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
|
|
|
if (errno == ENOENT) {
|
2012-11-19 08:30:30 +08:00
|
|
|
wcstring dir = wdirname(d);
|
2016-04-28 07:10:14 +08:00
|
|
|
if (!create_directory(dir)) {
|
|
|
|
if (!wmkdir(d, 0700)) {
|
2012-11-19 08:30:30 +08:00
|
|
|
ok = 1;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
return ok ? 0 : -1;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
__attribute__((noinline)) void bugreport() {
|
2016-05-16 10:45:02 +08:00
|
|
|
debug(1, _(L"This is a bug. Break on bugreport to debug. "
|
2016-04-28 07:10:14 +08:00
|
|
|
L"If you can reproduce it, please send a bug report to %s."),
|
2012-11-19 08:30:30 +08:00
|
|
|
PACKAGE_BUGREPORT);
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
wcstring format_size(long long sz) {
|
2012-11-19 08:30:30 +08:00
|
|
|
wcstring result;
|
2016-04-28 07:10:14 +08:00
|
|
|
const wchar_t *sz_name[] = {L"kB", L"MB", L"GB", L"TB", L"PB", L"EB", L"ZB", L"YB", 0};
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
if (sz < 0) {
|
2012-11-19 08:30:30 +08:00
|
|
|
result.append(L"unknown");
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (sz < 1) {
|
2012-11-19 08:30:30 +08:00
|
|
|
result.append(_(L"empty"));
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (sz < 1024) {
|
2012-11-19 08:30:30 +08:00
|
|
|
result.append(format_string(L"%lldB", sz));
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2012-11-19 08:30:30 +08:00
|
|
|
int i;
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
for (i = 0; sz_name[i]; i++) {
|
|
|
|
if (sz < (1024 * 1024) || !sz_name[i + 1]) {
|
|
|
|
long isz = ((long)sz) / 1024;
|
2012-11-19 08:30:30 +08:00
|
|
|
if (isz > 9)
|
|
|
|
result.append(format_string(L"%d%ls", isz, sz_name[i]));
|
|
|
|
else
|
2016-04-28 07:10:14 +08:00
|
|
|
result.append(format_string(L"%.1f%ls", (double)sz / 1024, sz_name[i]));
|
2012-11-19 08:30:30 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
sz /= 1024;
|
|
|
|
}
|
|
|
|
}
|
2012-02-10 02:14:06 +08:00
|
|
|
return result;
|
2007-10-15 17:51:08 +08:00
|
|
|
}
|
2009-02-03 06:46:45 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
/// Crappy function to extract the most significant digit of an unsigned long long value.
|
|
|
|
static char extract_most_significant_digit(unsigned long long *xp) {
|
2012-03-01 03:27:14 +08:00
|
|
|
unsigned long long place_value = 1;
|
|
|
|
unsigned long long x = *xp;
|
2016-04-28 07:10:14 +08:00
|
|
|
while (x >= 10) {
|
2012-03-01 03:27:14 +08:00
|
|
|
x /= 10;
|
|
|
|
place_value *= 10;
|
|
|
|
}
|
|
|
|
*xp -= (place_value * x);
|
|
|
|
return x + '0';
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void append_ull(char *buff, unsigned long long val, size_t *inout_idx, size_t max_len) {
|
2012-03-01 03:27:14 +08:00
|
|
|
size_t idx = *inout_idx;
|
2016-04-28 07:10:14 +08:00
|
|
|
while (val > 0 && idx < max_len) buff[idx++] = extract_most_significant_digit(&val);
|
2012-03-01 03:27:14 +08:00
|
|
|
*inout_idx = idx;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void append_str(char *buff, const char *str, size_t *inout_idx, size_t max_len) {
|
2012-03-01 03:27:14 +08:00
|
|
|
size_t idx = *inout_idx;
|
2016-04-28 07:10:14 +08:00
|
|
|
while (*str && idx < max_len) buff[idx++] = *str++;
|
2012-03-01 03:27:14 +08:00
|
|
|
*inout_idx = idx;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void format_size_safe(char buff[128], unsigned long long sz) {
|
2012-03-01 03:27:14 +08:00
|
|
|
const size_t buff_size = 128;
|
2016-04-28 07:10:14 +08:00
|
|
|
const size_t max_len = buff_size - 1; // need to leave room for a null terminator
|
2014-12-08 14:17:44 +08:00
|
|
|
memset(buff, 0, buff_size);
|
2012-03-01 03:27:14 +08:00
|
|
|
size_t idx = 0;
|
2016-04-28 07:10:14 +08:00
|
|
|
const char *const sz_name[] = {"kB", "MB", "GB", "TB", "PB", "EB", "ZB", "YB", NULL};
|
|
|
|
if (sz < 1) {
|
2012-03-01 03:27:14 +08:00
|
|
|
strncpy(buff, "empty", buff_size);
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (sz < 1024) {
|
2012-03-01 03:27:14 +08:00
|
|
|
append_ull(buff, sz, &idx, max_len);
|
|
|
|
append_str(buff, "B", &idx, max_len);
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
|
|
|
for (size_t i = 0; sz_name[i]; i++) {
|
|
|
|
if (sz < (1024 * 1024) || !sz_name[i + 1]) {
|
|
|
|
unsigned long long isz = sz / 1024;
|
|
|
|
if (isz > 9) {
|
2012-03-01 03:27:14 +08:00
|
|
|
append_ull(buff, isz, &idx, max_len);
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
|
|
|
if (isz == 0) {
|
2012-03-01 03:27:14 +08:00
|
|
|
append_str(buff, "0", &idx, max_len);
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2012-03-01 03:27:14 +08:00
|
|
|
append_ull(buff, isz, &idx, max_len);
|
|
|
|
}
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Maybe append a single fraction digit.
|
2012-03-01 03:27:14 +08:00
|
|
|
unsigned long long remainder = sz % 1024;
|
2016-04-28 07:10:14 +08:00
|
|
|
if (remainder > 0) {
|
2012-03-01 03:27:14 +08:00
|
|
|
char tmp[3] = {'.', extract_most_significant_digit(&remainder), 0};
|
|
|
|
append_str(buff, tmp, &idx, max_len);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
append_str(buff, sz_name[i], &idx, max_len);
|
2012-11-19 08:30:30 +08:00
|
|
|
break;
|
|
|
|
}
|
|
|
|
sz /= 1024;
|
|
|
|
}
|
2012-03-01 03:27:14 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-06-25 10:25:48 +08:00
|
|
|
/// Return the number of seconds from the UNIX epoch, with subsecond precision. This function uses
|
|
|
|
/// the gettimeofday function and will have the same precision as that function.
|
2016-04-28 07:10:14 +08:00
|
|
|
double timef() {
|
2012-11-19 08:30:30 +08:00
|
|
|
struct timeval tv;
|
2016-06-25 10:25:48 +08:00
|
|
|
VOMIT_ON_FAILURE(gettimeofday(&tv, 0));
|
|
|
|
// return (double)tv.tv_sec + 0.000001 * tv.tv_usec;
|
|
|
|
return (double)tv.tv_sec + 1e-6 * tv.tv_usec;
|
2012-11-19 08:30:30 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void exit_without_destructors(int code) { _exit(code); }
|
2012-02-29 07:11:46 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
/// Helper function to convert from a null_terminated_array_t<wchar_t> to a
|
|
|
|
/// null_terminated_array_t<char_t>.
|
|
|
|
void convert_wide_array_to_narrow(const null_terminated_array_t<wchar_t> &wide_arr,
|
|
|
|
null_terminated_array_t<char> *output) {
|
2012-03-01 03:27:14 +08:00
|
|
|
const wchar_t *const *arr = wide_arr.get();
|
2016-04-28 07:10:14 +08:00
|
|
|
if (!arr) {
|
2013-02-23 08:22:56 +08:00
|
|
|
output->clear();
|
|
|
|
return;
|
|
|
|
}
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2012-03-01 03:27:14 +08:00
|
|
|
std::vector<std::string> list;
|
2016-04-28 07:10:14 +08:00
|
|
|
for (size_t i = 0; arr[i]; i++) {
|
2012-03-01 03:27:14 +08:00
|
|
|
list.push_back(wcs2string(arr[i]));
|
|
|
|
}
|
2013-02-23 08:22:56 +08:00
|
|
|
output->set(list);
|
2012-03-01 03:27:14 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void append_path_component(wcstring &path, const wcstring &component) {
|
|
|
|
if (path.empty() || component.empty()) {
|
2012-05-09 17:33:42 +08:00
|
|
|
path.append(component);
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2012-05-09 17:33:42 +08:00
|
|
|
size_t path_len = path.size();
|
2016-04-28 07:10:14 +08:00
|
|
|
bool path_slash = path.at(path_len - 1) == L'/';
|
2012-05-09 17:33:42 +08:00
|
|
|
bool comp_slash = component.at(0) == L'/';
|
2016-04-28 07:10:14 +08:00
|
|
|
if (!path_slash && !comp_slash) {
|
2012-05-09 17:33:42 +08:00
|
|
|
// Need a slash
|
|
|
|
path.push_back(L'/');
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (path_slash && comp_slash) {
|
|
|
|
// Too many slashes.
|
2012-05-09 17:33:42 +08:00
|
|
|
path.erase(path_len - 1, 1);
|
|
|
|
}
|
2011-12-27 11:18:46 +08:00
|
|
|
path.append(component);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
extern "C" {
|
2016-04-28 07:10:14 +08:00
|
|
|
__attribute__((noinline)) void debug_thread_error(void) {
|
|
|
|
while (1) sleep(9999999);
|
2011-12-27 11:18:46 +08:00
|
|
|
}
|
2012-01-06 05:58:48 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void set_main_thread() { main_thread_id = pthread_self(); }
|
|
|
|
|
|
|
|
void configure_thread_assertions_for_testing(void) {
|
2012-05-14 11:19:02 +08:00
|
|
|
thread_assertions_configured_for_testing = true;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
bool is_forked_child(void) {
|
|
|
|
// Just bail if nobody's called setup_fork_guards, e.g. some of our tools.
|
|
|
|
if (!initial_pid) return false;
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2012-03-07 06:34:18 +08:00
|
|
|
bool is_child_of_fork = (getpid() != initial_pid);
|
2016-04-28 07:10:14 +08:00
|
|
|
if (is_child_of_fork) {
|
2012-03-01 03:27:14 +08:00
|
|
|
printf("Uh-oh: %d\n", getpid());
|
|
|
|
while (1) sleep(10000);
|
|
|
|
}
|
2012-02-28 10:43:24 +08:00
|
|
|
return is_child_of_fork;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void setup_fork_guards(void) {
|
|
|
|
// Notice when we fork by stashing our pid. This seems simpler than pthread_atfork().
|
2012-03-07 06:34:18 +08:00
|
|
|
initial_pid = getpid();
|
2012-02-28 10:43:24 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void save_term_foreground_process_group(void) {
|
2012-11-18 18:16:14 +08:00
|
|
|
initial_foreground_process_group = tcgetpgrp(STDIN_FILENO);
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void restore_term_foreground_process_group(void) {
|
|
|
|
if (initial_foreground_process_group != -1) {
|
|
|
|
// This is called during shutdown and from a signal handler. We don't bother to complain on
|
|
|
|
// failure.
|
|
|
|
tcsetpgrp(STDIN_FILENO, initial_foreground_process_group);
|
2012-11-18 18:16:14 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
bool is_main_thread() {
|
2012-11-19 08:30:30 +08:00
|
|
|
assert(main_thread_id != 0);
|
|
|
|
return main_thread_id == pthread_self();
|
2012-01-06 05:58:48 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void assert_is_main_thread(const char *who) {
|
|
|
|
if (!is_main_thread() && !thread_assertions_configured_for_testing) {
|
|
|
|
fprintf(stderr,
|
|
|
|
"Warning: %s called off of main thread. Break on debug_thread_error to debug.\n",
|
|
|
|
who);
|
2011-12-27 11:18:46 +08:00
|
|
|
debug_thread_error();
|
2012-02-28 10:43:24 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void assert_is_not_forked_child(const char *who) {
|
|
|
|
if (is_forked_child()) {
|
|
|
|
fprintf(stderr,
|
|
|
|
"Warning: %s called in a forked child. Break on debug_thread_error to debug.\n",
|
|
|
|
who);
|
2012-02-28 10:43:24 +08:00
|
|
|
debug_thread_error();
|
2011-12-27 11:18:46 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void assert_is_background_thread(const char *who) {
|
|
|
|
if (is_main_thread() && !thread_assertions_configured_for_testing) {
|
|
|
|
fprintf(stderr,
|
|
|
|
"Warning: %s called on the main thread (may block!). Break on debug_thread_error "
|
|
|
|
"to debug.\n",
|
|
|
|
who);
|
2011-12-27 11:18:46 +08:00
|
|
|
debug_thread_error();
|
2012-02-25 04:13:35 +08:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void assert_is_locked(void *vmutex, const char *who, const char *caller) {
|
|
|
|
pthread_mutex_t *mutex = static_cast<pthread_mutex_t *>(vmutex);
|
|
|
|
if (0 == pthread_mutex_trylock(mutex)) {
|
|
|
|
fprintf(stderr,
|
|
|
|
"Warning: %s is not locked when it should be in '%s'. Break on debug_thread_error "
|
|
|
|
"to debug.\n",
|
|
|
|
who, caller);
|
2012-02-25 04:13:35 +08:00
|
|
|
debug_thread_error();
|
|
|
|
pthread_mutex_unlock(mutex);
|
|
|
|
}
|
2011-12-27 11:18:46 +08:00
|
|
|
}
|
2012-02-28 10:43:24 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void scoped_lock::lock(void) {
|
|
|
|
assert(!locked);
|
2016-05-16 10:45:02 +08:00
|
|
|
ASSERT_IS_NOT_FORKED_CHILD();
|
2014-08-24 15:59:03 +08:00
|
|
|
VOMIT_ON_FAILURE_NO_ERRNO(pthread_mutex_lock(lock_obj));
|
2012-02-28 10:43:24 +08:00
|
|
|
locked = true;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void scoped_lock::unlock(void) {
|
2012-02-28 10:43:24 +08:00
|
|
|
assert(locked);
|
2016-05-16 10:45:02 +08:00
|
|
|
ASSERT_IS_NOT_FORKED_CHILD();
|
2014-08-24 15:59:03 +08:00
|
|
|
VOMIT_ON_FAILURE_NO_ERRNO(pthread_mutex_unlock(lock_obj));
|
2012-02-28 10:43:24 +08:00
|
|
|
locked = false;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
scoped_lock::scoped_lock(pthread_mutex_t &mutex) : lock_obj(&mutex), locked(false) { this->lock(); }
|
2012-02-28 10:43:24 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
scoped_lock::scoped_lock(mutex_lock_t &lock) : lock_obj(&lock.mutex), locked(false) {
|
2014-05-05 06:06:40 +08:00
|
|
|
this->lock();
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
scoped_lock::~scoped_lock() {
|
2012-02-28 10:43:24 +08:00
|
|
|
if (locked) this->unlock();
|
|
|
|
}
|
2012-07-21 05:33:08 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void scoped_rwlock::lock(void) {
|
|
|
|
assert(!(locked || locked_shared));
|
2016-05-16 10:45:02 +08:00
|
|
|
ASSERT_IS_NOT_FORKED_CHILD();
|
2014-08-24 15:59:03 +08:00
|
|
|
VOMIT_ON_FAILURE_NO_ERRNO(pthread_rwlock_rdlock(rwlock_obj));
|
|
|
|
locked = true;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void scoped_rwlock::unlock(void) {
|
2014-08-24 15:59:03 +08:00
|
|
|
assert(locked);
|
2016-05-16 10:45:02 +08:00
|
|
|
ASSERT_IS_NOT_FORKED_CHILD();
|
2014-08-24 15:59:03 +08:00
|
|
|
VOMIT_ON_FAILURE_NO_ERRNO(pthread_rwlock_unlock(rwlock_obj));
|
|
|
|
locked = false;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void scoped_rwlock::lock_shared(void) {
|
|
|
|
assert(!(locked || locked_shared));
|
2016-05-16 10:45:02 +08:00
|
|
|
ASSERT_IS_NOT_FORKED_CHILD();
|
2014-08-24 15:59:03 +08:00
|
|
|
VOMIT_ON_FAILURE_NO_ERRNO(pthread_rwlock_wrlock(rwlock_obj));
|
|
|
|
locked_shared = true;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void scoped_rwlock::unlock_shared(void) {
|
2014-08-24 15:59:03 +08:00
|
|
|
assert(locked_shared);
|
2016-05-16 10:45:02 +08:00
|
|
|
ASSERT_IS_NOT_FORKED_CHILD();
|
2014-08-24 15:59:03 +08:00
|
|
|
VOMIT_ON_FAILURE_NO_ERRNO(pthread_rwlock_unlock(rwlock_obj));
|
|
|
|
locked_shared = false;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
void scoped_rwlock::upgrade(void) {
|
2014-08-24 15:59:03 +08:00
|
|
|
assert(locked_shared);
|
2016-05-16 10:45:02 +08:00
|
|
|
ASSERT_IS_NOT_FORKED_CHILD();
|
2014-08-24 15:59:03 +08:00
|
|
|
VOMIT_ON_FAILURE_NO_ERRNO(pthread_rwlock_unlock(rwlock_obj));
|
|
|
|
locked = false;
|
|
|
|
VOMIT_ON_FAILURE_NO_ERRNO(pthread_rwlock_wrlock(rwlock_obj));
|
|
|
|
locked_shared = true;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
scoped_rwlock::scoped_rwlock(pthread_rwlock_t &rwlock, bool shared)
|
|
|
|
: rwlock_obj(&rwlock), locked(false), locked_shared(false) {
|
|
|
|
if (shared) {
|
2014-08-24 15:59:03 +08:00
|
|
|
this->lock_shared();
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2014-08-24 15:59:03 +08:00
|
|
|
this->lock();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
scoped_rwlock::scoped_rwlock(rwlock_t &rwlock, bool shared)
|
|
|
|
: rwlock_obj(&rwlock.rwlock), locked(false), locked_shared(false) {
|
|
|
|
if (shared) {
|
2014-08-24 15:59:03 +08:00
|
|
|
this->lock_shared();
|
2016-04-28 07:10:14 +08:00
|
|
|
} else {
|
2014-08-24 15:59:03 +08:00
|
|
|
this->lock();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
scoped_rwlock::~scoped_rwlock() {
|
|
|
|
if (locked) {
|
2014-08-24 15:59:03 +08:00
|
|
|
this->unlock();
|
2016-04-28 07:10:14 +08:00
|
|
|
} else if (locked_shared) {
|
2014-08-24 15:59:03 +08:00
|
|
|
this->unlock_shared();
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
wcstokenizer::wcstokenizer(const wcstring &s, const wcstring &separator)
|
|
|
|
: buffer(), str(), state(), sep(separator) {
|
2012-07-21 05:33:08 +08:00
|
|
|
buffer = wcsdup(s.c_str());
|
|
|
|
str = buffer;
|
|
|
|
state = NULL;
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
bool wcstokenizer::next(wcstring &result) {
|
2012-07-21 05:33:08 +08:00
|
|
|
wchar_t *tmp = wcstok(str, sep.c_str(), &state);
|
|
|
|
str = NULL;
|
|
|
|
if (tmp) result = tmp;
|
|
|
|
return tmp != NULL;
|
|
|
|
}
|
2012-11-19 08:30:30 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
wcstokenizer::~wcstokenizer() { free(buffer); }
|
2013-02-23 08:22:56 +08:00
|
|
|
|
|
|
|
template <typename CharType_t>
|
2016-04-28 07:10:14 +08:00
|
|
|
static CharType_t **make_null_terminated_array_helper(
|
|
|
|
const std::vector<std::basic_string<CharType_t> > &argv) {
|
2013-02-23 08:22:56 +08:00
|
|
|
size_t count = argv.size();
|
2013-02-24 04:47:10 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// We allocate everything in one giant block. First compute how much space we need.
|
|
|
|
// N + 1 pointers.
|
2013-02-23 08:22:56 +08:00
|
|
|
size_t pointers_allocation_len = (count + 1) * sizeof(CharType_t *);
|
2013-02-24 04:47:10 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// In the very unlikely event that CharType_t has stricter alignment requirements than does a
|
|
|
|
// pointer, round us up to the size of a CharType_t.
|
2013-02-23 08:22:56 +08:00
|
|
|
pointers_allocation_len += sizeof(CharType_t) - 1;
|
|
|
|
pointers_allocation_len -= pointers_allocation_len % sizeof(CharType_t);
|
2013-02-24 04:47:10 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// N null terminated strings.
|
2013-02-23 08:22:56 +08:00
|
|
|
size_t strings_allocation_len = 0;
|
2016-04-28 07:10:14 +08:00
|
|
|
for (size_t i = 0; i < count; i++) {
|
|
|
|
// The size of the string, plus a null terminator.
|
2013-02-23 08:22:56 +08:00
|
|
|
strings_allocation_len += (argv.at(i).size() + 1) * sizeof(CharType_t);
|
|
|
|
}
|
2013-02-24 04:47:10 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Now allocate their sum.
|
|
|
|
unsigned char *base =
|
|
|
|
static_cast<unsigned char *>(malloc(pointers_allocation_len + strings_allocation_len));
|
|
|
|
if (!base) return NULL;
|
2013-02-24 04:47:10 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Divvy it up into the pointers and strings.
|
2013-02-23 08:22:56 +08:00
|
|
|
CharType_t **pointers = reinterpret_cast<CharType_t **>(base);
|
|
|
|
CharType_t *strings = reinterpret_cast<CharType_t *>(base + pointers_allocation_len);
|
2013-02-24 04:47:10 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Start copying.
|
|
|
|
for (size_t i = 0; i < count; i++) {
|
2013-02-23 08:22:56 +08:00
|
|
|
const std::basic_string<CharType_t> &str = argv.at(i);
|
2016-04-28 07:10:14 +08:00
|
|
|
*pointers++ = strings; // store the current string pointer into self
|
|
|
|
strings = std::copy(str.begin(), str.end(), strings); // copy the string into strings
|
|
|
|
*strings++ = (CharType_t)(0); // each string needs a null terminator
|
2013-02-23 08:22:56 +08:00
|
|
|
}
|
2016-04-28 07:10:14 +08:00
|
|
|
*pointers++ = NULL; // array of pointers needs a null terminator
|
2013-02-24 04:47:10 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
// Make sure we know what we're doing.
|
2013-02-24 04:47:10 +08:00
|
|
|
assert((unsigned char *)pointers - base == (std::ptrdiff_t)pointers_allocation_len);
|
2016-04-28 07:10:14 +08:00
|
|
|
assert((unsigned char *)strings - (unsigned char *)pointers ==
|
|
|
|
(std::ptrdiff_t)strings_allocation_len);
|
|
|
|
assert((unsigned char *)strings - base ==
|
|
|
|
(std::ptrdiff_t)(pointers_allocation_len + strings_allocation_len));
|
2013-02-24 04:47:10 +08:00
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
return reinterpret_cast<CharType_t **>(base);
|
2013-02-23 08:22:56 +08:00
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
wchar_t **make_null_terminated_array(const wcstring_list_t &lst) {
|
2013-02-23 08:22:56 +08:00
|
|
|
return make_null_terminated_array_helper(lst);
|
|
|
|
}
|
|
|
|
|
2016-04-28 07:10:14 +08:00
|
|
|
char **make_null_terminated_array(const std::vector<std::string> &lst) {
|
2013-02-23 08:22:56 +08:00
|
|
|
return make_null_terminated_array_helper(lst);
|
|
|
|
}
|
2016-05-17 05:30:31 +08:00
|
|
|
|
|
|
|
long convert_digit(wchar_t d, int base) {
|
|
|
|
long res = -1;
|
|
|
|
if ((d <= L'9') && (d >= L'0')) {
|
|
|
|
res = d - L'0';
|
|
|
|
} else if ((d <= L'z') && (d >= L'a')) {
|
|
|
|
res = d + 10 - L'a';
|
|
|
|
} else if ((d <= L'Z') && (d >= L'A')) {
|
|
|
|
res = d + 10 - L'A';
|
|
|
|
}
|
|
|
|
if (res >= base) {
|
|
|
|
res = -1;
|
|
|
|
}
|
|
|
|
|
|
|
|
return res;
|
|
|
|
}
|
2016-10-18 07:23:29 +08:00
|
|
|
|
|
|
|
// Test if the specified character is in a range that fish uses interally to store special tokens.
|
|
|
|
//
|
|
|
|
// NOTE: This is used when tokenizing the input. It is also used when reading input, before
|
|
|
|
// tokenization, to replace such chars with REPLACEMENT_WCHAR if they're not part of a quoted
|
|
|
|
// string. We don't want external input to be able to feed reserved characters into our lexer/parser
|
|
|
|
// or code evaluator.
|
|
|
|
//
|
|
|
|
// TODO: Actually implement the replacement as documented above.
|
|
|
|
bool fish_reserved_codepoint(wchar_t c) {
|
|
|
|
return (c >= RESERVED_CHAR_BASE && c < RESERVED_CHAR_END) ||
|
|
|
|
(c >= ENCODE_DIRECT_BASE && c < ENCODE_DIRECT_END) ||
|
|
|
|
(c >= INPUT_COMMON_BASE && c < INPUT_COMMON_END);
|
|
|
|
}
|