2016-04-30 10:01:36 +08:00
|
|
|
// This file only contains fallback implementations of functions which have been found to be missing
|
|
|
|
// or broken by the configuration scripts.
|
|
|
|
//
|
|
|
|
// Many of these functions are more or less broken and incomplete. lrand48_r internally uses the
|
|
|
|
// regular (bad) rand_r function, the gettext function doesn't actually do anything, etc.
|
2006-02-28 21:17:16 +08:00
|
|
|
#include "config.h"
|
|
|
|
|
2016-04-21 14:00:54 +08:00
|
|
|
// IWYU likes to recommend adding term.h when we want ncurses.h.
|
|
|
|
// IWYU pragma: no_include term.h
|
2016-04-30 10:01:36 +08:00
|
|
|
#include <assert.h> // IWYU pragma: keep
|
|
|
|
#include <dirent.h> // IWYU pragma: keep
|
|
|
|
#include <errno.h> // IWYU pragma: keep
|
|
|
|
#include <fcntl.h> // IWYU pragma: keep
|
|
|
|
#include <limits.h> // IWYU pragma: keep
|
|
|
|
#include <stdarg.h> // IWYU pragma: keep
|
|
|
|
#include <stdio.h> // IWYU pragma: keep
|
2006-02-28 21:17:16 +08:00
|
|
|
#include <stdlib.h>
|
2016-04-30 10:01:36 +08:00
|
|
|
#include <string.h>
|
|
|
|
#include <sys/stat.h> // IWYU pragma: keep
|
2016-04-21 14:00:54 +08:00
|
|
|
#include <sys/types.h> // IWYU pragma: keep
|
2016-04-30 10:01:36 +08:00
|
|
|
#include <unistd.h>
|
2006-02-28 21:17:16 +08:00
|
|
|
#include <wchar.h>
|
|
|
|
#include <wctype.h>
|
2013-04-17 12:41:58 +08:00
|
|
|
#if HAVE_GETTEXT
|
|
|
|
#include <libintl.h>
|
|
|
|
#endif
|
2006-02-28 21:17:16 +08:00
|
|
|
#if HAVE_NCURSES_H
|
2016-04-21 14:00:54 +08:00
|
|
|
#include <ncurses.h> // IWYU pragma: keep
|
2014-12-07 16:41:15 +08:00
|
|
|
#elif HAVE_NCURSES_CURSES_H
|
|
|
|
#include <ncurses/curses.h>
|
2006-02-28 21:17:16 +08:00
|
|
|
#else
|
|
|
|
#include <curses.h>
|
|
|
|
#endif
|
|
|
|
#if HAVE_TERM_H
|
2016-04-21 14:00:54 +08:00
|
|
|
#include <term.h> // IWYU pragma: keep
|
2006-02-28 21:17:16 +08:00
|
|
|
#elif HAVE_NCURSES_TERM_H
|
|
|
|
#include <ncurses/term.h>
|
|
|
|
#endif
|
2016-04-21 14:00:54 +08:00
|
|
|
#include <signal.h> // IWYU pragma: keep
|
2016-04-30 10:01:36 +08:00
|
|
|
#include <wchar.h> // IWYU pragma: keep
|
2006-02-28 21:17:16 +08:00
|
|
|
|
2016-10-10 05:38:26 +08:00
|
|
|
#include "common.h" // IWYU pragma: keep
|
2016-04-21 14:00:54 +08:00
|
|
|
#include "fallback.h" // IWYU pragma: keep
|
2016-04-30 10:01:36 +08:00
|
|
|
#include "util.h" // IWYU pragma: keep
|
2006-03-02 19:30:29 +08:00
|
|
|
|
2007-08-22 15:57:41 +08:00
|
|
|
#ifdef TPARM_SOLARIS_KLUDGE
|
|
|
|
#undef tparm
|
|
|
|
|
2016-04-30 10:01:36 +08:00
|
|
|
/// Checks for known string values and maps to correct number of parameters.
|
|
|
|
char *tparm_solaris_kludge(char *str, ...) {
|
|
|
|
long int param[9] = {};
|
2012-11-19 08:30:30 +08:00
|
|
|
|
|
|
|
va_list ap;
|
|
|
|
va_start(ap, str);
|
|
|
|
|
2016-04-30 10:01:36 +08:00
|
|
|
if ((set_a_foreground && !strcmp(str, set_a_foreground)) ||
|
|
|
|
(set_a_background && !strcmp(str, set_a_background)) ||
|
|
|
|
(set_foreground && !strcmp(str, set_foreground)) ||
|
|
|
|
(set_background && !strcmp(str, set_background)) ||
|
|
|
|
(enter_underline_mode && !strcmp(str, enter_underline_mode)) ||
|
|
|
|
(exit_underline_mode && !strcmp(str, exit_underline_mode)) ||
|
|
|
|
(enter_standout_mode && !strcmp(str, enter_standout_mode)) ||
|
|
|
|
(exit_standout_mode && !strcmp(str, exit_standout_mode)) ||
|
|
|
|
(flash_screen && !strcmp(str, flash_screen)) ||
|
|
|
|
(enter_subscript_mode && !strcmp(str, enter_subscript_mode)) ||
|
|
|
|
(exit_subscript_mode && !strcmp(str, exit_subscript_mode)) ||
|
|
|
|
(enter_superscript_mode && !strcmp(str, enter_superscript_mode)) ||
|
|
|
|
(exit_superscript_mode && !strcmp(str, exit_superscript_mode)) ||
|
|
|
|
(enter_blink_mode && !strcmp(str, enter_blink_mode)) ||
|
|
|
|
(enter_italics_mode && !strcmp(str, enter_italics_mode)) ||
|
|
|
|
(exit_italics_mode && !strcmp(str, exit_italics_mode)) ||
|
|
|
|
(enter_reverse_mode && !strcmp(str, enter_reverse_mode)) ||
|
|
|
|
(enter_shadow_mode && !strcmp(str, enter_shadow_mode)) ||
|
|
|
|
(exit_shadow_mode && !strcmp(str, exit_shadow_mode)) ||
|
|
|
|
(enter_secure_mode && !strcmp(str, enter_secure_mode)) ||
|
|
|
|
(enter_bold_mode && !strcmp(str, enter_bold_mode))) {
|
2012-11-19 08:30:30 +08:00
|
|
|
param[0] = va_arg(ap, long int);
|
2016-04-30 10:01:36 +08:00
|
|
|
} else if (cursor_address && !strcmp(str, cursor_address)) {
|
2012-11-19 08:30:30 +08:00
|
|
|
param[0] = va_arg(ap, long int);
|
|
|
|
param[1] = va_arg(ap, long int);
|
|
|
|
}
|
|
|
|
|
|
|
|
va_end(ap);
|
|
|
|
|
2016-04-30 10:01:36 +08:00
|
|
|
return tparm(str, param[0], param[1], param[2], param[3], param[4], param[5], param[6],
|
|
|
|
param[7], param[8]);
|
2007-08-22 15:57:41 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
// Re-defining just to make sure nothing breaks further down in this file.
|
|
|
|
#define tparm tparm_solaris_kludge
|
|
|
|
|
|
|
|
#endif
|
|
|
|
|
2016-05-29 13:28:26 +08:00
|
|
|
#if __APPLE__
|
2016-04-30 10:01:36 +08:00
|
|
|
/// Fallback implementations of wcsdup and wcscasecmp. On systems where these are not needed (e.g.
|
|
|
|
/// building on Linux) these should end up just being stripped, as they are static functions that
|
|
|
|
/// are not referenced in this file.
|
|
|
|
/// Returns a newly malloc()ed copy of the NUL-terminated wide string `in`, or a null pointer if
/// the allocation fails. The caller owns the result and releases it with free().
__attribute__((unused)) static wchar_t *wcsdup_fallback(const wchar_t *in) {
    // Size in bytes of the string including its terminating NUL.
    const size_t bytes = sizeof(wchar_t) * (wcslen(in) + 1);
    wchar_t *copy = (wchar_t *)malloc(bytes);
    if (copy != 0) {
        memcpy(copy, in, bytes);
    }
    return copy;
}
|
2016-05-29 13:28:26 +08:00
|
|
|
#endif
|
2006-02-28 21:17:16 +08:00
|
|
|
|
2016-04-30 10:01:36 +08:00
|
|
|
/// Case-insensitive comparison of two NUL-terminated wide strings.
///
/// Returns 0 if the strings are equal ignoring case, -1 if `a` is a proper prefix of `b`, 1 if
/// `b` is a proper prefix of `a`, and otherwise the difference between the lower-cased values of
/// the first pair of characters that differ.
///
/// Implemented as a loop rather than recursively so that stack usage does not grow with the
/// length of the strings.
__attribute__((unused)) static int wcscasecmp_fallback(const wchar_t *a, const wchar_t *b) {
    for (;; a++, b++) {
        if (*a == 0) {
            return *b == 0 ? 0 : -1;
        }
        if (*b == 0) {
            return 1;
        }
        int diff = towlower(*a) - towlower(*b);
        if (diff != 0) {
            return diff;
        }
    }
}
|
|
|
|
|
2016-04-30 10:01:36 +08:00
|
|
|
/// Case-insensitive comparison of at most `count` characters of two NUL-terminated wide strings.
///
/// Returns 0 if the first `count` characters are equal ignoring case (or both strings end
/// together before that), -1 if `a` ends first, 1 if `b` ends first, and otherwise the difference
/// between the lower-cased values of the first pair of characters that differ.
///
/// Implemented as a loop rather than recursively so that stack usage does not grow with `count`.
__attribute__((unused)) static int wcsncasecmp_fallback(const wchar_t *a, const wchar_t *b,
                                                        size_t count) {
    for (; count != 0; a++, b++, count--) {
        if (*a == 0) {
            return *b == 0 ? 0 : -1;
        }
        if (*b == 0) {
            return 1;
        }
        int diff = towlower(*a) - towlower(*b);
        if (diff != 0) {
            return diff;
        }
    }
    return 0;
}
|
|
|
|
|
2016-05-19 08:46:13 +08:00
|
|
|
#if __APPLE__
|
|
|
|
#if __DARWIN_C_LEVEL >= 200809L
|
2016-04-30 10:01:36 +08:00
|
|
|
// Note parens avoid the macro expansion.
|
|
|
|
wchar_t *wcsdup_use_weak(const wchar_t *a) {
|
|
|
|
if (&wcsdup != NULL) return (wcsdup)(a);
|
2012-07-21 05:33:08 +08:00
|
|
|
return wcsdup_fallback(a);
|
|
|
|
}
|
|
|
|
|
2016-04-30 10:01:36 +08:00
|
|
|
int wcscasecmp_use_weak(const wchar_t *a, const wchar_t *b) {
|
|
|
|
if (&wcscasecmp != NULL) return (wcscasecmp)(a, b);
|
2012-07-21 05:33:08 +08:00
|
|
|
return wcscasecmp_fallback(a, b);
|
|
|
|
}
|
2012-11-18 18:23:22 +08:00
|
|
|
|
2016-04-30 10:01:36 +08:00
|
|
|
int wcsncasecmp_use_weak(const wchar_t *s1, const wchar_t *s2, size_t n) {
|
|
|
|
if (&wcsncasecmp != NULL) return (wcsncasecmp)(s1, s2, n);
|
2013-05-17 10:44:21 +08:00
|
|
|
return wcsncasecmp_fallback(s1, s2, n);
|
|
|
|
}
|
2016-05-28 05:41:16 +08:00
|
|
|
#else // __DARWIN_C_LEVEL >= 200809L
|
2016-05-19 08:46:13 +08:00
|
|
|
/// Defines wcsdup in terms of wcsdup_fallback.
wchar_t *wcsdup(const wchar_t *in) {
    wchar_t *copy = wcsdup_fallback(in);
    return copy;
}
|
|
|
|
/// Defines wcscasecmp in terms of wcscasecmp_fallback.
int wcscasecmp(const wchar_t *a, const wchar_t *b) {
    const int order = wcscasecmp_fallback(a, b);
    return order;
}
|
2016-05-28 05:41:16 +08:00
|
|
|
/// Defines wcsncasecmp in terms of wcsncasecmp_fallback.
int wcsncasecmp(const wchar_t *a, const wchar_t *b, size_t n) {
    const int order = wcsncasecmp_fallback(a, b, n);
    return order;
}
|
|
|
|
#endif // __DARWIN_C_LEVEL >= 200809L
|
2016-05-19 08:46:13 +08:00
|
|
|
#endif // __APPLE__
|
2012-07-21 05:33:08 +08:00
|
|
|
|
2006-02-28 21:17:16 +08:00
|
|
|
#ifndef HAVE_WCSNDUP
|
2016-04-30 10:01:36 +08:00
|
|
|
/// Returns a newly malloc()ed, NUL-terminated copy of at most `c` characters of `in`, or a null
/// pointer if the allocation fails. The caller owns the result and releases it with free().
///
/// Only the characters that are actually copied are measured and allocated, so a very large `c`
/// (including (size_t)-1) cannot wrap the allocation size, and `in` is never read past its
/// terminating NUL or past `c` characters.
wchar_t *wcsndup(const wchar_t *in, size_t c) {
    // Length of the prefix to copy: stop at the NUL or after c characters, whichever is first.
    size_t len = 0;
    while (len < c && in[len] != L'\0') {
        len++;
    }

    // Guard the size computation below against overflow.
    if (len >= (size_t)-1 / sizeof(wchar_t)) {
        return 0;
    }

    wchar_t *res = (wchar_t *)malloc(sizeof(wchar_t) * (len + 1));
    if (res == 0) {
        return 0;
    }
    memcpy(res, in, sizeof(wchar_t) * len);
    res[len] = L'\0';
    return res;
}
|
|
|
|
#endif
|
|
|
|
|
2006-04-19 17:56:28 +08:00
|
|
|
#ifndef HAVE_WCSLCPY
|
|
|
|
/*$OpenBSD: strlcpy.c,v 1.8 2003/06/17 21:56:24 millert Exp $*/
|
|
|
|
|
|
|
|
/*
|
|
|
|
* Copyright (c) 1998 Todd C. Miller <Todd.Miller@courtesan.com>
|
|
|
|
*
|
|
|
|
* Permission to use, copy, modify, and distribute this software for any
|
|
|
|
* purpose with or without fee is hereby granted, provided that the above
|
|
|
|
* copyright notice and this permission notice appear in all copies.
|
|
|
|
*
|
|
|
|
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
|
|
|
|
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
|
|
|
|
* MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
|
|
|
|
* ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
|
|
|
|
* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
|
|
|
|
* ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
|
|
|
|
* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
|
|
|
|
*/
|
2016-04-30 10:01:36 +08:00
|
|
|
/// Copies `src` into `dst`, a buffer with room for `siz` wide characters. At most siz - 1
/// characters are copied and `dst` is always NUL-terminated unless `siz` is 0, in which case
/// `dst` is not written at all.
///
/// Returns the length of `src`, not counting its NUL. A return value >= `siz` means the copy was
/// truncated.
size_t wcslcpy(wchar_t *dst, const wchar_t *src, size_t siz) {
    size_t copied = 0;

    if (siz != 0) {
        // Copy as many characters as will fit, leaving room for the terminator.
        while (copied + 1 < siz && src[copied] != 0) {
            dst[copied] = src[copied];
            copied++;
        }
        // NUL-terminate dst.
        dst[copied] = '\0';
    }

    // Walk the remainder of src so the full source length can be reported.
    size_t total = copied;
    while (src[total] != 0) {
        total++;
    }
    return total;
}
|
|
|
|
#endif
|
2006-02-28 21:17:16 +08:00
|
|
|
|
2006-06-15 18:53:15 +08:00
|
|
|
#ifndef HAVE_LRAND48_R
|
2016-04-30 10:01:36 +08:00
|
|
|
int lrand48_r(struct drand48_data *buffer, long int *result) {
|
2012-11-19 08:30:30 +08:00
|
|
|
*result = rand_r(&buffer->seed);
|
|
|
|
return 0;
|
2006-06-15 18:53:15 +08:00
|
|
|
}
|
|
|
|
|
2016-04-30 10:01:36 +08:00
|
|
|
int srand48_r(long int seedval, struct drand48_data *buffer) {
|
2012-11-19 08:30:30 +08:00
|
|
|
buffer->seed = (unsigned int)seedval;
|
|
|
|
return 0;
|
2006-06-15 18:53:15 +08:00
|
|
|
}
|
|
|
|
#endif
|
2006-06-21 22:15:44 +08:00
|
|
|
|
|
|
|
#ifndef HAVE_FUTIMES
|
2016-04-30 10:01:36 +08:00
|
|
|
/// Stub that does nothing with its arguments: it sets errno to ENOSYS and returns -1.
int futimes(int fd, const struct timeval *times) {
    (void)fd;
    (void)times;
    errno = ENOSYS;
    return -1;
}
|
2006-07-20 06:55:49 +08:00
|
|
|
#endif
|
|
|
|
|
2013-04-09 01:20:56 +08:00
|
|
|
#if HAVE_GETTEXT
|
2016-04-30 10:01:36 +08:00
|
|
|
/// Returns the result of gettext() for `msgid`.
char *fish_gettext(const char *msgid) {
    char *translated = gettext(msgid);
    return translated;
}
|
|
|
|
|
2016-04-30 10:01:36 +08:00
|
|
|
/// Returns the result of bindtextdomain() for `domainname` and `dirname`.
char *fish_bindtextdomain(const char *domainname, const char *dirname) {
    char *bound_dir = bindtextdomain(domainname, dirname);
    return bound_dir;
}
|
|
|
|
|
2016-04-30 10:01:36 +08:00
|
|
|
/// Returns the result of textdomain() for `domainname`.
char *fish_textdomain(const char *domainname) {
    char *current = textdomain(domainname);
    return current;
}
|
2013-04-09 01:20:56 +08:00
|
|
|
#else
|
2016-04-30 10:01:36 +08:00
|
|
|
/// Returns `msgid` itself, cast to a non-const pointer. No translation is performed.
char *fish_gettext(const char *msgid) {
    char *untranslated = (char *)msgid;
    return untranslated;
}
|
2016-10-10 05:38:26 +08:00
|
|
|
/// Stub: ignores both arguments and returns NULL.
char *fish_bindtextdomain(const char *domainname, const char *dirname) {
    (void)domainname;
    (void)dirname;
    return NULL;
}
|
|
|
|
/// Stub: ignores its argument and returns NULL.
char *fish_textdomain(const char *domainname) {
    (void)domainname;
    return NULL;
}
|
2006-07-20 07:11:49 +08:00
|
|
|
#endif
|
2006-07-20 06:55:49 +08:00
|
|
|
|
2006-07-31 04:59:41 +08:00
|
|
|
#ifndef HAVE_KILLPG
|
2016-04-30 10:01:36 +08:00
|
|
|
/// Sends `sig` to process group `pgr` by calling kill() with the negated group id and returns
/// kill()'s result. Asserts that `pgr` is greater than 1.
int killpg(int pgr, int sig) {
    assert(pgr > 1);
    const int negated_group = -pgr;
    return kill(negated_group, sig);
}
|
|
|
|
#endif
|
2006-08-28 19:43:05 +08:00
|
|
|
|
2016-05-16 07:19:27 +08:00
|
|
|
// Big hack to use our versions of wcwidth/wcswidth wherever the system versions are known to be broken, which is
|
|
|
|
// EVERYWHERE (https://github.com/fish-shell/fish-shell/issues/2199)
|
2012-07-16 01:45:18 +08:00
|
|
|
#ifndef HAVE_BROKEN_WCWIDTH
|
2012-11-19 08:30:30 +08:00
|
|
|
#define HAVE_BROKEN_WCWIDTH 1
|
2012-07-16 01:45:18 +08:00
|
|
|
#endif
|
|
|
|
|
2016-04-30 10:01:36 +08:00
|
|
|
#if !HAVE_BROKEN_WCWIDTH
|
|
|
|
/// Returns the result of the system wcwidth() for `wc`.
int fish_wcwidth(wchar_t wc) {
    const int columns = wcwidth(wc);
    return columns;
}
|
|
|
|
/// Returns the result of the system wcswidth() for `str` and `n`.
int fish_wcswidth(const wchar_t *str, size_t n) {
    const int columns = wcswidth(str, n);
    return columns;
}
|
2012-07-16 01:45:18 +08:00
|
|
|
#else
|
|
|
|
static int mk_wcwidth(wchar_t wc);
|
|
|
|
static int mk_wcswidth(const wchar_t *pwcs, size_t n);
|
2016-04-30 10:01:36 +08:00
|
|
|
/// Returns the width of `wc` as computed by mk_wcwidth().
int fish_wcwidth(wchar_t wc) {
    const int columns = mk_wcwidth(wc);
    return columns;
}
|
|
|
|
/// Returns the width of `str` and `n` as computed by mk_wcswidth().
int fish_wcswidth(const wchar_t *str, size_t n) {
    const int columns = mk_wcswidth(str, n);
    return columns;
}
|
2012-07-16 01:45:18 +08:00
|
|
|
|
|
|
|
/*
|
|
|
|
* This is an implementation of wcwidth() and wcswidth() (defined in
|
|
|
|
* IEEE Std 1003.1-2001) for Unicode.
|
|
|
|
*
|
|
|
|
* http://www.opengroup.org/onlinepubs/007904975/functions/wcwidth.html
|
|
|
|
* http://www.opengroup.org/onlinepubs/007904975/functions/wcswidth.html
|
|
|
|
*
|
|
|
|
* In fixed-width output devices, Latin characters all occupy a single
|
|
|
|
* "cell" position of equal width, whereas ideographic CJK characters
|
|
|
|
* occupy two such cells. Interoperability between terminal-line
|
|
|
|
* applications and (teletype-style) character terminals using the
|
|
|
|
* UTF-8 encoding requires agreement on which character should advance
|
|
|
|
* the cursor by how many cell positions. No established formal
|
|
|
|
* standards exist at present on which Unicode character shall occupy
|
|
|
|
* how many cell positions on character terminals. These routines are
|
|
|
|
* a first attempt of defining such behavior based on simple rules
|
|
|
|
* applied to data provided by the Unicode Consortium.
|
|
|
|
*
|
|
|
|
* For some graphical characters, the Unicode standard explicitly
|
|
|
|
* defines a character-cell width via the definition of the East Asian
|
|
|
|
* FullWidth (F), Wide (W), Half-width (H), and Narrow (Na) classes.
|
|
|
|
* In all these cases, there is no ambiguity about which width a
|
|
|
|
* terminal shall use. For characters in the East Asian Ambiguous (A)
|
|
|
|
* class, the width choice depends purely on a preference of backward
|
|
|
|
* compatibility with either historic CJK or Western practice.
|
|
|
|
* Choosing single-width for these characters is easy to justify as
|
|
|
|
* the appropriate long-term solution, as the CJK practice of
|
|
|
|
* displaying these characters as double-width comes from historic
|
|
|
|
* implementation simplicity (8-bit encoded characters were displayed
|
|
|
|
* single-width and 16-bit ones double-width, even for Greek,
|
|
|
|
* Cyrillic, etc.) and not any typographic considerations.
|
|
|
|
*
|
|
|
|
* Much less clear is the choice of width for the Not East Asian
|
|
|
|
* (Neutral) class. Existing practice does not dictate a width for any
|
|
|
|
* of these characters. It would nevertheless make sense
|
|
|
|
* typographically to allocate two character cells to characters such
|
|
|
|
* as for instance EM SPACE or VOLUME INTEGRAL, which cannot be
|
|
|
|
* represented adequately with a single-width glyph. The following
|
|
|
|
* routines at present merely assign a single-cell width to all
|
|
|
|
* neutral characters, in the interest of simplicity. This is not
|
|
|
|
* entirely satisfactory and should be reconsidered before
|
|
|
|
* establishing a formal standard in this area. At the moment, the
|
|
|
|
* decision which Not East Asian (Neutral) characters should be
|
|
|
|
* represented by double-width glyphs cannot yet be answered by
|
|
|
|
* applying a simple rule from the Unicode database content. Setting
|
|
|
|
* up a proper standard for the behavior of UTF-8 character terminals
|
|
|
|
* will require a careful analysis not only of each Unicode character,
|
|
|
|
* but also of each presentation form, something the author of these
|
|
|
|
* routines has avoided to do so far.
|
|
|
|
*
|
|
|
|
* http://www.unicode.org/unicode/reports/tr11/
|
|
|
|
*
|
|
|
|
* Markus Kuhn -- 2007-05-26 (Unicode 5.0)
|
|
|
|
*
|
|
|
|
* Permission to use, copy, modify, and distribute this software
|
|
|
|
* for any purpose and without fee is hereby granted. The author
|
|
|
|
* disclaims all warranties with regard to this software.
|
|
|
|
*
|
|
|
|
* Latest version: http://www.cl.cam.ac.uk/~mgk25/ucs/wcwidth.c
|
|
|
|
*/
|
2016-04-30 10:01:36 +08:00
|
|
|
/// An inclusive range of character values, used as the element type of the lookup tables that
/// bisearch() searches.
struct interval {
    int first;  // lowest value in the range
    int last;   // highest value in the range
};
|
|
|
|
|
2016-04-30 10:01:36 +08:00
|
|
|
// Auxiliary function for binary search in interval table.
|
|
|
|
static int bisearch(wchar_t ucs, const struct interval *table, int max) {
|
2012-11-19 08:30:30 +08:00
|
|
|
int min = 0;
|
2012-07-16 01:45:18 +08:00
|
|
|
|
2016-04-30 10:01:36 +08:00
|
|
|
if (ucs < table[0].first || ucs > table[max].last) return 0;
|
|
|
|
while (max >= min) {
|
2016-02-20 07:45:12 +08:00
|
|
|
int mid = (min + max) / 2;
|
2012-11-19 08:30:30 +08:00
|
|
|
if (ucs > table[mid].last)
|
|
|
|
min = mid + 1;
|
|
|
|
else if (ucs < table[mid].first)
|
|
|
|
max = mid - 1;
|
|
|
|
else
|
|
|
|
return 1;
|
|
|
|
}
|
2012-07-16 01:45:18 +08:00
|
|
|
|
2012-11-19 08:30:30 +08:00
|
|
|
return 0;
|
2012-07-16 01:45:18 +08:00
|
|
|
}
|
|
|
|
|
2016-04-30 10:01:36 +08:00
|
|
|
// The following two functions define the column width of an ISO 10646 character as follows:
|
|
|
|
//
|
|
|
|
// - The null character (U+0000) has a column width of 0.
|
|
|
|
//
|
|
|
|
// - Other C0/C1 control characters and DEL will lead to a return
|
|
|
|
// value of -1.
|
|
|
|
//
|
|
|
|
// - Non-spacing and enclosing combining characters (general
|
|
|
|
// category code Mn or Me in the Unicode database) have a
|
|
|
|
// column width of 0.
|
|
|
|
//
|
|
|
|
// - SOFT HYPHEN (U+00AD) has a column width of 1.
|
|
|
|
//
|
|
|
|
// - Other format characters (general category code Cf in the Unicode
|
|
|
|
// database) and ZERO WIDTH SPACE (U+200B) have a column width of 0.
|
|
|
|
//
|
|
|
|
// - Hangul Jamo medial vowels and final consonants (U+1160-U+11FF)
|
|
|
|
// have a column width of 0.
|
|
|
|
//
|
|
|
|
// - Spacing characters in the East Asian Wide (W) or East Asian
|
|
|
|
// Full-width (F) category as defined in Unicode Technical
|
|
|
|
// Report #11 have a column width of 2.
|
|
|
|
//
|
|
|
|
// - All remaining characters (including all printable
|
|
|
|
// ISO 8859-1 and WGL4 characters, Unicode control characters,
|
|
|
|
// etc.) have a column width of 1.
|
|
|
|
//
|
|
|
|
// This implementation assumes that wchar_t characters are encoded
|
|
|
|
// in ISO 10646.
|
|
|
|
static int mk_wcwidth(wchar_t ucs) {
|
|
|
|
// Sorted list of non-overlapping intervals of non-spacing characters.
|
|
|
|
// Generated by "uniset +cat=Me +cat=Mn +cat=Cf -00AD +1160-11FF +200B c".
|
|
|
|
static const struct interval combining[] = {
|
|
|
|
{0x0300, 0x036F}, {0x0483, 0x0486}, {0x0488, 0x0489}, {0x0591, 0x05BD},
|
|
|
|
{0x05BF, 0x05BF}, {0x05C1, 0x05C2}, {0x05C4, 0x05C5}, {0x05C7, 0x05C7},
|
|
|
|
{0x0600, 0x0603}, {0x0610, 0x0615}, {0x064B, 0x065E}, {0x0670, 0x0670},
|
|
|
|
{0x06D6, 0x06E4}, {0x06E7, 0x06E8}, {0x06EA, 0x06ED}, {0x070F, 0x070F},
|
|
|
|
{0x0711, 0x0711}, {0x0730, 0x074A}, {0x07A6, 0x07B0}, {0x07EB, 0x07F3},
|
|
|
|
{0x0901, 0x0902}, {0x093C, 0x093C}, {0x0941, 0x0948}, {0x094D, 0x094D},
|
|
|
|
{0x0951, 0x0954}, {0x0962, 0x0963}, {0x0981, 0x0981}, {0x09BC, 0x09BC},
|
|
|
|
{0x09C1, 0x09C4}, {0x09CD, 0x09CD}, {0x09E2, 0x09E3}, {0x0A01, 0x0A02},
|
|
|
|
{0x0A3C, 0x0A3C}, {0x0A41, 0x0A42}, {0x0A47, 0x0A48}, {0x0A4B, 0x0A4D},
|
|
|
|
{0x0A70, 0x0A71}, {0x0A81, 0x0A82}, {0x0ABC, 0x0ABC}, {0x0AC1, 0x0AC5},
|
|
|
|
{0x0AC7, 0x0AC8}, {0x0ACD, 0x0ACD}, {0x0AE2, 0x0AE3}, {0x0B01, 0x0B01},
|
|
|
|
{0x0B3C, 0x0B3C}, {0x0B3F, 0x0B3F}, {0x0B41, 0x0B43}, {0x0B4D, 0x0B4D},
|
|
|
|
{0x0B56, 0x0B56}, {0x0B82, 0x0B82}, {0x0BC0, 0x0BC0}, {0x0BCD, 0x0BCD},
|
|
|
|
{0x0C3E, 0x0C40}, {0x0C46, 0x0C48}, {0x0C4A, 0x0C4D}, {0x0C55, 0x0C56},
|
|
|
|
{0x0CBC, 0x0CBC}, {0x0CBF, 0x0CBF}, {0x0CC6, 0x0CC6}, {0x0CCC, 0x0CCD},
|
|
|
|
{0x0CE2, 0x0CE3}, {0x0D41, 0x0D43}, {0x0D4D, 0x0D4D}, {0x0DCA, 0x0DCA},
|
|
|
|
{0x0DD2, 0x0DD4}, {0x0DD6, 0x0DD6}, {0x0E31, 0x0E31}, {0x0E34, 0x0E3A},
|
|
|
|
{0x0E47, 0x0E4E}, {0x0EB1, 0x0EB1}, {0x0EB4, 0x0EB9}, {0x0EBB, 0x0EBC},
|
|
|
|
{0x0EC8, 0x0ECD}, {0x0F18, 0x0F19}, {0x0F35, 0x0F35}, {0x0F37, 0x0F37},
|
|
|
|
{0x0F39, 0x0F39}, {0x0F71, 0x0F7E}, {0x0F80, 0x0F84}, {0x0F86, 0x0F87},
|
|
|
|
{0x0F90, 0x0F97}, {0x0F99, 0x0FBC}, {0x0FC6, 0x0FC6}, {0x102D, 0x1030},
|
|
|
|
{0x1032, 0x1032}, {0x1036, 0x1037}, {0x1039, 0x1039}, {0x1058, 0x1059},
|
|
|
|
{0x1160, 0x11FF}, {0x135F, 0x135F}, {0x1712, 0x1714}, {0x1732, 0x1734},
|
|
|
|
{0x1752, 0x1753}, {0x1772, 0x1773}, {0x17B4, 0x17B5}, {0x17B7, 0x17BD},
|
|
|
|
{0x17C6, 0x17C6}, {0x17C9, 0x17D3}, {0x17DD, 0x17DD}, {0x180B, 0x180D},
|
|
|
|
{0x18A9, 0x18A9}, {0x1920, 0x1922}, {0x1927, 0x1928}, {0x1932, 0x1932},
|
|
|
|
{0x1939, 0x193B}, {0x1A17, 0x1A18}, {0x1B00, 0x1B03}, {0x1B34, 0x1B34},
|
|
|
|
{0x1B36, 0x1B3A}, {0x1B3C, 0x1B3C}, {0x1B42, 0x1B42}, {0x1B6B, 0x1B73},
|
|
|
|
{0x1DC0, 0x1DCA}, {0x1DFE, 0x1DFF}, {0x200B, 0x200F}, {0x202A, 0x202E},
|
|
|
|
{0x2060, 0x2063}, {0x206A, 0x206F}, {0x20D0, 0x20EF}, {0x302A, 0x302F},
|
|
|
|
{0x3099, 0x309A}, {0xA806, 0xA806}, {0xA80B, 0xA80B}, {0xA825, 0xA826},
|
|
|
|
{0xFB1E, 0xFB1E}, {0xFE00, 0xFE0F}, {0xFE20, 0xFE23}, {0xFEFF, 0xFEFF},
|
|
|
|
{0xFFF9, 0xFFFB}, {0x10A01, 0x10A03}, {0x10A05, 0x10A06}, {0x10A0C, 0x10A0F},
|
|
|
|
{0x10A38, 0x10A3A}, {0x10A3F, 0x10A3F}, {0x1D167, 0x1D169}, {0x1D173, 0x1D182},
|
|
|
|
{0x1D185, 0x1D18B}, {0x1D1AA, 0x1D1AD}, {0x1D242, 0x1D244}, {0xE0001, 0xE0001},
|
|
|
|
{0xE0020, 0xE007F}, {0xE0100, 0xE01EF}};
|
|
|
|
|
|
|
|
// Test for 8-bit control characters.
|
|
|
|
if (ucs == 0) return 0;
|
|
|
|
if (ucs < 32 || (ucs >= 0x7f && ucs < 0xa0)) return -1;
|
|
|
|
|
|
|
|
// Binary search in table of non-spacing characters.
|
|
|
|
if (bisearch(ucs, combining, sizeof(combining) / sizeof(struct interval) - 1)) return 0;
|
|
|
|
|
|
|
|
// If we arrive here, ucs is not a combining or C0/C1 control character.
|
|
|
|
return 1 + (ucs >= 0x1100 &&
|
|
|
|
(ucs <= 0x115f || /* Hangul Jamo init. consonants */
|
|
|
|
ucs == 0x2329 || ucs == 0x232a ||
|
|
|
|
(ucs >= 0x2e80 && ucs <= 0xa4cf && ucs != 0x303f) || /* CJK ... Yi */
|
|
|
|
(ucs >= 0xac00 && ucs <= 0xd7a3) || /* Hangul Syllables */
|
|
|
|
(ucs >= 0xf900 && ucs <= 0xfaff) || /* CJK Compatibility Ideographs */
|
|
|
|
(ucs >= 0xfe10 && ucs <= 0xfe19) || /* Vertical forms */
|
|
|
|
(ucs >= 0xfe30 && ucs <= 0xfe6f) || /* CJK Compatibility Forms */
|
|
|
|
(ucs >= 0xff00 && ucs <= 0xff60) || /* Fullwidth Forms */
|
|
|
|
(ucs >= 0xffe0 && ucs <= 0xffe6) || (ucs >= 0x20000 && ucs <= 0x2fffd) ||
|
|
|
|
(ucs >= 0x30000 && ucs <= 0x3fffd)));
|
2012-07-16 01:45:18 +08:00
|
|
|
}
|
|
|
|
|
2016-04-30 10:01:36 +08:00
|
|
|
/// Returns the sum of mk_wcwidth() over the characters of `pwcs`, stopping at the first NUL or
/// after `n` characters, whichever comes first. Returns -1 as soon as any character has a
/// negative width.
static int mk_wcswidth(const wchar_t *pwcs, size_t n) {
    int total = 0;
    size_t idx = 0;
    while (idx < n && pwcs[idx] != L'\0') {
        const int cell = mk_wcwidth(pwcs[idx]);
        if (cell < 0) {
            return -1;
        }
        total += cell;
        idx++;
    }
    return total;
}
|
2016-04-30 10:01:36 +08:00
|
|
|
#endif // HAVE_BROKEN_WCWIDTH
|