fish-shell/src/env_dispatch.cpp

678 lines
26 KiB
C++
Raw Normal View History

// Support for dispatching on environment changes.
#include "config.h" // IWYU pragma: keep
#include <errno.h>
#include <limits.h>
#include <locale.h>
#include <stddef.h>
#include <stdlib.h>
#include <time.h>
#include <unistd.h>
#include <cstring>
#include <cwchar>
#if HAVE_CURSES_H
#include <curses.h>
#elif HAVE_NCURSES_H
#include <ncurses.h>
#elif HAVE_NCURSES_CURSES_H
#include <ncurses/curses.h>
#endif
#if HAVE_TERM_H
#include <term.h>
#elif HAVE_NCURSES_TERM_H
#include <ncurses/term.h>
#endif
#include <assert.h>
#include <algorithm>
#include <functional>
#include <memory>
#include <string>
#include <unordered_map>
#include <utility>
#include "common.h"
#include "complete.h"
#include "env.h"
#include "env_dispatch.h"
#include "env_universal_common.h"
#include "event.h"
#include "fallback.h" // IWYU pragma: keep
#include "flog.h"
#include "function.h"
#include "global_safety.h"
#include "history.h"
#include "input_common.h"
#include "maybe.h"
#include "output.h"
#include "parser.h"
#include "proc.h"
#include "reader.h"
#include "screen.h"
#include "termsize.h"
#include "trace.h"
#include "wutil.h" // IWYU pragma: keep
/// List of all locale environment variable names that might trigger (re)initializing the locale
/// subsystem. These are only the variables we're possibly interested in.
static const wcstring locale_variables[] = {
L"LANG", L"LANGUAGE", L"LC_ALL",
L"LC_COLLATE", L"LC_CTYPE", L"LC_MESSAGES",
L"LC_NUMERIC", L"LC_TIME", L"fish_allow_singlebyte_locale",
L"LOCPATH"};
/// List of all curses environment variable names that might trigger (re)initializing the curses
/// subsystem.
static const wcstring curses_variables[] = {L"TERM", L"TERMINFO", L"TERMINFO_DIRS"};
2019-04-01 02:11:52 +00:00
class var_dispatch_table_t {
using named_callback_t = std::function<void(const wcstring &, env_stack_t &)>;
2019-04-01 02:11:52 +00:00
std::unordered_map<wcstring, named_callback_t> named_table_;
2019-04-01 02:11:52 +00:00
using anon_callback_t = std::function<void(env_stack_t &)>;
std::unordered_map<wcstring, anon_callback_t> anon_table_;
2019-04-01 02:11:52 +00:00
bool observes_var(const wcstring &name) {
return named_table_.count(name) || anon_table_.count(name);
}
public:
/// Add a callback for the given variable, which expects the name.
/// We must not already be observing this variable.
void add(wcstring name, named_callback_t cb) {
assert(!observes_var(name) && "Already observing that variable");
named_table_.emplace(std::move(name), std::move(cb));
}
/// Add a callback for the given variable, which ignores the name.
/// We must not already be observing this variable.
void add(wcstring name, anon_callback_t cb) {
assert(!observes_var(name) && "Already observing that variable");
anon_table_.emplace(std::move(name), std::move(cb));
}
void dispatch(const wcstring &key, env_stack_t &vars) const {
2019-04-01 02:11:52 +00:00
auto named = named_table_.find(key);
if (named != named_table_.end()) {
named->second(key, vars);
2019-04-01 02:11:52 +00:00
}
auto anon = anon_table_.find(key);
if (anon != anon_table_.end()) {
anon->second(vars);
}
}
};
// Forward declarations.
static void init_curses(const environment_t &vars);
static void init_locale(const environment_t &vars);
static void update_fish_color_support(const environment_t &vars);
/// True if we think we can set the terminal title.
static relaxed_atomic_bool_t can_set_term_title{false};
// Run those dispatch functions which want to be run at startup.
static void run_inits(const environment_t &vars);
2019-04-01 02:11:52 +00:00
// return a new-ly allocated dispatch table, running those dispatch functions which should be
// initialized.
static std::unique_ptr<const var_dispatch_table_t> create_dispatch_table();
// A pointer to the variable dispatch table. This is allocated with new() and deliberately leaked to
// avoid shutdown destructors. This is set during startup and should not be modified after.
static latch_t<const var_dispatch_table_t> s_var_dispatch_table;
2019-04-01 02:11:52 +00:00
void env_dispatch_init(const environment_t &vars) {
run_inits(vars);
// Note this deliberately leaks; the dispatch table is immortal.
// Via this construct we can avoid invoking destructors at shutdown.
2019-04-29 02:16:55 +00:00
s_var_dispatch_table = create_dispatch_table();
}
/// Properly sets all timezone information.
static void handle_timezone(const wchar_t *env_var_name, const environment_t &vars) {
const auto var = vars.get(env_var_name, ENV_DEFAULT);
2020-01-19 13:42:12 +00:00
FLOGF(env_dispatch, L"handle_timezone() current timezone var: |%ls| => |%ls|", env_var_name,
!var ? L"MISSING" : var->as_string().c_str());
std::string name = wcs2string(env_var_name);
if (var.missing_or_empty()) {
unsetenv_lock(name.c_str());
} else {
const std::string value = wcs2string(var->as_string());
setenv_lock(name.c_str(), value.c_str(), 1);
}
tzset();
}
/// Update the value of g_fish_emoji_width
static void guess_emoji_width(const environment_t &vars) {
if (auto width_str = vars.get(L"fish_emoji_width")) {
int new_width = fish_wcstol(width_str->as_string().c_str());
2021-11-08 19:36:01 +00:00
g_fish_emoji_width = std::min(2, std::max(1, new_width));
2020-01-30 01:06:11 +00:00
FLOGF(term_support, "'fish_emoji_width' preference: %d, overwriting default",
g_fish_emoji_width);
return;
}
wcstring term;
if (auto term_var = vars.get(L"TERM_PROGRAM")) {
term = term_var->as_string();
}
double version = 0;
if (auto version_var = vars.get(L"TERM_PROGRAM_VERSION")) {
std::string narrow_version = wcs2string(version_var->as_string());
version = strtod(narrow_version.c_str(), nullptr);
}
if (term == L"Apple_Terminal" && version >= 400) {
// Apple Terminal on High Sierra
g_fish_emoji_width = 2;
FLOGF(term_support, "default emoji width: 2 for %ls", term.c_str());
} else if (term == L"iTerm.app") {
// iTerm2 now defaults to Unicode 9 sizes for anything after macOS 10.12.
g_fish_emoji_width = 2;
FLOGF(term_support, "default emoji width for iTerm: 2");
} else {
// Default to whatever system wcwidth says to U+1F603,
// but only if it's at least 1 and at most 2.
int w = wcwidth(L'😃');
2021-11-08 19:36:01 +00:00
g_fish_emoji_width = std::min(2, std::max(1, w));
FLOGF(term_support, "default emoji width: %d", g_fish_emoji_width);
}
}
/// React to modifying the given variable.
void env_dispatch_var_change(const wcstring &key, env_stack_t &vars) {
2019-04-01 02:11:52 +00:00
// Do nothing if not yet fully initialized.
if (!s_var_dispatch_table) return;
s_var_dispatch_table->dispatch(key, vars);
}
static void handle_fish_term_change(const env_stack_t &vars) {
update_fish_color_support(vars);
reader_schedule_prompt_repaint();
}
static void handle_change_ambiguous_width(const env_stack_t &vars) {
int new_width = 1;
if (auto width_str = vars.get(L"fish_ambiguous_width")) {
new_width = fish_wcstol(width_str->as_string().c_str());
}
g_fish_ambiguous_width = std::max(0, new_width);
}
static void handle_term_size_change(const env_stack_t &vars) {
termsize_container_t::shared().handle_columns_lines_var_change(vars);
}
static void handle_fish_history_change(const env_stack_t &vars) {
reader_change_history(history_session_id(vars));
}
static void handle_fish_cursor_selection_mode_change(const env_stack_t &vars) {
auto mode = vars.get(L"fish_cursor_selection_mode");
reader_change_cursor_selection_mode(mode && mode->as_string() == L"inclusive"
? cursor_selection_mode_t::inclusive
: cursor_selection_mode_t::exclusive);
}
void handle_autosuggestion_change(const env_stack_t &vars) {
reader_set_autosuggestion_enabled(vars);
}
static void handle_function_path_change(const env_stack_t &vars) {
UNUSED(vars);
function_invalidate_path();
}
static void handle_complete_path_change(const env_stack_t &vars) {
UNUSED(vars);
complete_invalidate_path();
}
static void handle_tz_change(const wcstring &var_name, const env_stack_t &vars) {
handle_timezone(var_name.c_str(), vars);
}
static void handle_locale_change(const environment_t &vars) {
init_locale(vars);
// We need to re-guess emoji width because the locale might have changed to a multibyte one.
guess_emoji_width(vars);
}
static void handle_curses_change(const environment_t &vars) {
guess_emoji_width(vars);
init_curses(vars);
}
/// Whether to use posix_spawn when possible.
static relaxed_atomic_bool_t g_use_posix_spawn{false};
bool get_use_posix_spawn() { return g_use_posix_spawn; }
extern "C" {
const char *gnu_get_libc_version();
}
static bool allow_use_posix_spawn() {
// OpenBSD's posix_spawn returns status 127, instead of erroring with ENOEXEC, when faced with a
// shebangless script. Disable posix_spawn on OpenBSD.
#if defined(__OpenBSD__)
return false;
#endif
bool result = true;
// uClibc defines __GLIBC__.
#if defined(__GLIBC__) && !defined(__UCLIBC__)
// Disallow posix_spawn entirely on glibc < 2.24.
// See #8021.
if (!__GLIBC_PREREQ(2, 24)) {
result = false;
}
#endif
return result;
}
static void handle_fish_use_posix_spawn_change(const environment_t &vars) {
// Note if the variable is missing or empty, we default to true if allowed.
if (!allow_use_posix_spawn()) {
g_use_posix_spawn = false;
} else if (auto var = vars.get(L"fish_use_posix_spawn")) {
g_use_posix_spawn = var->empty() || bool_from_string(var->as_string());
} else {
g_use_posix_spawn = true;
}
}
/// Allow the user to override the limit on how much data the `read` command will process.
/// This is primarily for testing but could be used by users in special situations.
static void handle_read_limit_change(const environment_t &vars) {
auto read_byte_limit_var = vars.get(L"fish_read_limit");
if (!read_byte_limit_var.missing_or_empty()) {
size_t limit = fish_wcstoull(read_byte_limit_var->as_string().c_str());
if (errno) {
2020-01-19 12:38:47 +00:00
FLOGF(warning, "Ignoring fish_read_limit since it is not valid");
} else {
read_byte_limit = limit;
}
}
}
static void handle_fish_trace(const environment_t &vars) {
trace_set_enabled(!vars.get(L"fish_trace").missing_or_empty());
}
/// Populate the dispatch table used by `env_dispatch_var_change()` to efficiently call the
/// appropriate function to handle a change to a variable.
2019-04-01 02:11:52 +00:00
/// Note this returns a new-allocated value that we expect to leak.
static std::unique_ptr<const var_dispatch_table_t> create_dispatch_table() {
auto var_dispatch_table = make_unique<var_dispatch_table_t>();
for (const auto &var_name : locale_variables) {
2019-04-01 02:11:52 +00:00
var_dispatch_table->add(var_name, handle_locale_change);
}
for (const auto &var_name : curses_variables) {
2019-04-01 02:11:52 +00:00
var_dispatch_table->add(var_name, handle_curses_change);
}
2019-04-01 02:11:52 +00:00
var_dispatch_table->add(L"fish_term256", handle_fish_term_change);
var_dispatch_table->add(L"fish_term24bit", handle_fish_term_change);
var_dispatch_table->add(L"fish_escape_delay_ms", update_wait_on_escape_ms);
var_dispatch_table->add(L"fish_emoji_width", guess_emoji_width);
2019-04-01 02:11:52 +00:00
var_dispatch_table->add(L"fish_ambiguous_width", handle_change_ambiguous_width);
var_dispatch_table->add(L"LINES", handle_term_size_change);
var_dispatch_table->add(L"COLUMNS", handle_term_size_change);
var_dispatch_table->add(L"fish_complete_path", handle_complete_path_change);
var_dispatch_table->add(L"fish_function_path", handle_function_path_change);
var_dispatch_table->add(L"fish_read_limit", handle_read_limit_change);
var_dispatch_table->add(L"fish_history", handle_fish_history_change);
var_dispatch_table->add(L"fish_autosuggestion_enabled", handle_autosuggestion_change);
2019-04-01 02:11:52 +00:00
var_dispatch_table->add(L"TZ", handle_tz_change);
var_dispatch_table->add(L"fish_use_posix_spawn", handle_fish_use_posix_spawn_change);
var_dispatch_table->add(L"fish_trace", handle_fish_trace);
var_dispatch_table->add(L"fish_cursor_selection_mode",
handle_fish_cursor_selection_mode_change);
// This std::move is required to avoid a build error on old versions of libc++ (#5801),
// but it causes a different warning under newer versions of GCC (observed under GCC 9.3.0,
// but not under llvm/clang 9).
#if __GNUC__ > 4
#pragma GCC diagnostic push
#pragma GCC diagnostic ignored "-Wredundant-move"
#endif
return std::move(var_dispatch_table);
#if __GNUC__ > 4
#pragma GCC diagnostic pop
#endif
}
static void run_inits(const environment_t &vars) {
// This is the subset of those dispatch functions which want to be run at startup.
init_locale(vars);
init_curses(vars);
guess_emoji_width(vars);
update_wait_on_escape_ms(vars);
handle_read_limit_change(vars);
handle_fish_use_posix_spawn_change(vars);
handle_fish_trace(vars);
}
/// Updates our idea of whether we support term256 and term24bit (see issue #10222).
static void update_fish_color_support(const environment_t &vars) {
// Detect or infer term256 support. If fish_term256 is set, we respect it;
// otherwise infer it from the TERM variable or use terminfo.
wcstring term;
bool support_term256 = false;
bool support_term24bit = false;
if (auto term_var = vars.get(L"TERM")) term = term_var->as_string();
if (auto fish_term256 = vars.get(L"fish_term256")) {
// $fish_term256
support_term256 = bool_from_string(fish_term256->as_string());
FLOGF(term_support, L"256 color support determined by '$fish_term256'");
} else if (term.find(L"256color") != wcstring::npos) {
// TERM is *256color*: 256 colors explicitly supported
support_term256 = true;
FLOGF(term_support, L"256 color support enabled for TERM=%ls", term.c_str());
} else if (term.find(L"xterm") != wcstring::npos) {
// Assume that all 'xterm's can handle 25
support_term256 = true;
FLOGF(term_support, L"256 color support enabled for TERM=%ls", term.c_str());
} else if (cur_term != nullptr) {
// See if terminfo happens to identify 256 colors
support_term256 = (max_colors >= 256);
FLOGF(term_support, L"256 color support: %d colors per terminfo entry for %ls", max_colors,
term.c_str());
}
// Handle $fish_term24bit
if (auto fish_term24bit = vars.get(L"fish_term24bit")) {
support_term24bit = bool_from_string(fish_term24bit->as_string());
FLOGF(term_support, L"'fish_term24bit' preference: 24-bit color %ls",
support_term24bit ? L"enabled" : L"disabled");
} else {
if (vars.get(L"STY") || string_prefixes_string(L"eterm", term)) {
// Screen and emacs' ansi-term swallow truecolor sequences,
// so we ignore them unless force-enabled.
FLOGF(term_support, L"Truecolor support: disabling for eterm/screen");
support_term24bit = false;
} else if (cur_term != nullptr && max_colors >= 32767) {
// $TERM wins, xterm-direct reports 32767 colors, we assume that's the minimum
// as xterm is weird when it comes to color.
FLOGF(term_support, L"Truecolor support: Enabling per terminfo for %ls with %d colors",
term.c_str(), max_colors);
support_term24bit = true;
} else {
if (auto ct = vars.get(L"COLORTERM")) {
// If someone set $COLORTERM, that's the sort of color they want.
if (ct->as_string() == L"truecolor" || ct->as_string() == L"24bit") {
FLOGF(term_support, L"Truecolor support: Enabling per $COLORTERM='%ls'",
ct->as_string().c_str());
support_term24bit = true;
}
} else if (vars.get(L"KONSOLE_VERSION") || vars.get(L"KONSOLE_PROFILE_NAME")) {
// All konsole versions that use $KONSOLE_VERSION are new enough to support this,
// so no check is necessary.
FLOGF(term_support, L"Truecolor support: Enabling for Konsole");
support_term24bit = true;
} else if (auto it = vars.get(L"ITERM_SESSION_ID")) {
// Supporting versions of iTerm include a colon here.
// We assume that if this is iTerm, it can't also be st, so having this check
// inside is okay.
if (it->as_string().find(L':') != wcstring::npos) {
FLOGF(term_support, L"Truecolor support: Enabling for ITERM");
support_term24bit = true;
}
} else if (string_prefixes_string(L"st-", term)) {
FLOGF(term_support, L"Truecolor support: Enabling for st");
support_term24bit = true;
} else if (auto vte = vars.get(L"VTE_VERSION")) {
if (fish_wcstod(vte->as_string(), nullptr) > 3600) {
FLOGF(term_support, L"Truecolor support: Enabling for VTE version %ls",
vte->as_string().c_str());
support_term24bit = true;
}
}
}
}
color_support_t support = (support_term256 ? color_support_term256 : 0) |
(support_term24bit ? color_support_term24bit : 0);
output_set_color_support(support);
}
// Try to initialize the terminfo/curses subsystem using our fallback terminal name. Do not set
// `TERM` to our fallback. We're only doing this in the hope of getting a functional
// shell. If we launch an external command that uses TERM it should get the same value we were
// given, if any.
static void initialize_curses_using_fallbacks(const environment_t &vars) {
// xterm-256color is the most used terminal type by a massive margin,
// especially counting terminals that are mostly compatible.
const wchar_t *const fallbacks[] = {L"xterm-256color", L"xterm", L"ansi", L"dumb"};
wcstring termstr = L"";
auto term_var = vars.get(L"TERM");
if (!term_var.missing_or_empty()) {
termstr = term_var->as_string();
}
for (const wchar_t *fallback : fallbacks) {
// If $TERM is already set to the fallback name we're about to use there isn't any point in
// seeing if the fallback name can be used.
if (termstr == fallback) {
continue;
}
int err_ret = 0;
std::string term = wcs2string(fallback);
bool success = (setupterm(&term[0], STDOUT_FILENO, &err_ret) == OK);
if (is_interactive_session()) {
if (success) {
FLOGF(warning, _(L"Using fallback terminal type '%s'."), term.c_str());
} else {
FLOGF(warning,
_(L"Could not set up terminal using the fallback terminal type '%s'."),
term.c_str());
}
}
if (success) {
break;
}
}
}
// Apply any platform-specific hacks to cur_term/
static void apply_term_hacks(const environment_t &vars) {
UNUSED(vars);
// Be careful, variables like "enter_italics_mode" are #defined to dereference through cur_term.
// See #8876.
if (!cur_term) {
return;
}
#ifdef __APPLE__
// Hack in missing italics and dim capabilities omitted from MacOS xterm-256color terminfo
// Helps Terminal.app/iTerm
wcstring term_prog;
if (auto var = vars.get(L"TERM_PROGRAM")) {
term_prog = var->as_string();
}
if (term_prog == L"Apple_Terminal" || term_prog == L"iTerm.app") {
const auto term = vars.get(L"TERM");
if (term && term->as_string() == L"xterm-256color") {
static char sitm_esc[] = "\x1B[3m";
static char ritm_esc[] = "\x1B[23m";
static char dim_esc[] = "\x1B[2m";
if (!enter_italics_mode) {
enter_italics_mode = sitm_esc;
}
if (!exit_italics_mode) {
exit_italics_mode = ritm_esc;
}
if (!enter_dim_mode) {
enter_dim_mode = dim_esc;
}
}
}
#endif
}
/// This is a pretty lame heuristic for detecting terminals that do not support setting the
/// title. If we recognise the terminal name as that of a virtual terminal, we assume it supports
/// setting the title. If we recognise it as that of a console, we assume it does not support
/// setting the title. Otherwise we check the ttyname and see if we believe it is a virtual
/// terminal.
///
/// One situation in which this breaks down is with screen, since screen supports setting the
/// terminal title if the underlying terminal does so, but will print garbage on terminals that
/// don't. Since we can't see the underlying terminal below screen there is no way to fix this.
2021-11-08 19:36:01 +00:00
static const wchar_t *const title_terms[] = {L"xterm", L"screen", L"tmux", L"nxterm",
L"rxvt", L"alacritty", L"wezterm"};
static bool does_term_support_setting_title(const environment_t &vars) {
const auto term_var = vars.get(L"TERM");
if (term_var.missing_or_empty()) return false;
const wcstring term_str = term_var->as_string();
const wchar_t *term = term_str.c_str();
bool recognized = contains(title_terms, term_var->as_string());
if (!recognized) recognized = !std::wcsncmp(term, L"xterm-", const_strlen(L"xterm-"));
if (!recognized) recognized = !std::wcsncmp(term, L"screen-", const_strlen(L"screen-"));
if (!recognized) recognized = !std::wcsncmp(term, L"tmux-", const_strlen(L"tmux-"));
if (!recognized) {
if (std::wcscmp(term, L"linux") == 0) return false;
if (std::wcscmp(term, L"dumb") == 0) return false;
// NetBSD
if (std::wcscmp(term, L"vt100") == 0) return false;
if (std::wcscmp(term, L"wsvt25") == 0) return false;
char buf[PATH_MAX];
int retval = ttyname_r(STDIN_FILENO, buf, PATH_MAX);
if (retval != 0 || std::strstr(buf, "tty") || std::strstr(buf, "/vc/")) return false;
}
return true;
}
/// Initialize the curses subsystem.
static void init_curses(const environment_t &vars) {
for (const auto &var_name : curses_variables) {
std::string name = wcs2string(var_name);
const auto var = vars.get(var_name, ENV_EXPORT);
if (var.missing_or_empty()) {
FLOGF(term_support, L"curses var %s missing or empty", name.c_str());
unsetenv_lock(name.c_str());
} else {
std::string value = wcs2string(var->as_string());
FLOGF(term_support, L"curses var %s='%s'", name.c_str(), value.c_str());
setenv_lock(name.c_str(), value.c_str(), 1);
}
}
int err_ret{0};
if (setupterm(nullptr, STDOUT_FILENO, &err_ret) == ERR) {
if (is_interactive_session()) {
auto term = vars.get(L"TERM");
2020-01-19 12:38:47 +00:00
FLOGF(warning, _(L"Could not set up terminal."));
if (term.missing_or_empty()) {
2020-01-19 12:38:47 +00:00
FLOGF(warning, _(L"TERM environment variable not set."));
} else {
2020-01-30 01:06:11 +00:00
FLOGF(warning, _(L"TERM environment variable set to '%ls'."),
term->as_string().c_str());
2020-01-19 12:38:47 +00:00
FLOGF(warning, _(L"Check that this terminal type is supported on this system."));
}
}
initialize_curses_using_fallbacks(vars);
}
apply_term_hacks(vars);
can_set_term_title = does_term_support_setting_title(vars);
term_has_xn =
tigetflag(const_cast<char *>("xenl")) == 1; // does terminal have the eat_newline_glitch
update_fish_color_support(vars);
// Invalidate the cached escape sequences since they may no longer be valid.
layout_cache_t::shared.clear();
curses_initialized = true;
}
static constexpr const char *utf8_locales[] = {
2021-11-08 19:36:01 +00:00
"C.UTF-8", "en_US.UTF-8", "en_GB.UTF-8", "de_DE.UTF-8", "C.utf8", "UTF-8",
Try to set LC_CTYPE to something UTF-8 capable (#8031) * Try to set LC_CTYPE to something UTF-8 capable When fish is started with LC_CTYPE=C (even just effectively, often via LC_ALL=C!), it's basically broken. There's no way to handle non-ASCII characters with a C locale unless we want to write our locale-independent replacements for all of the system functions. Since we're not going to do that, let's try to find *some locale* for LC_CTYPE. We already do that in __fish_setlocale, but that's - a bit of a weird thing that reads unstandardized system configuration files - allows setting locale to C explicitly So it's still easily possible to end up in a broken configuration. Now, the issue with this is that there is (AFAICT) no portable way to get a list of all allowed locales and C.UTF-8 is not standardized, so we have no one locale to fall back on and are forced to try a few. The list we have here is quite arbitrary, but it's a start. Python does something similar and only tries C.UTF-8, C.utf8 and "UTF-8". Once C.UTF-8 is (hopefully) standardized, that will just start working (tm). Note that we do not *export* the fixed LC_CTYPE variable, so external programs still have to deal with the C locale, but we have no real business messing with the user's environment. To turn it off: $fish_allow_singlebyte_locale, if set to something true (like "1"), will re-run the locale initialization and skip the bit where we force LC_CTYPE to be utf8-capable. This is mainly used in our tests, but might also be useful if people are trying to do something weird.
2021-06-06 07:28:32 +00:00
};
/// Initialize the locale subsystem.
static void init_locale(const environment_t &vars) {
// We have to make a copy because the subsequent setlocale() call to change the locale will
// invalidate the pointer from the this setlocale() call.
char *old_msg_locale = strdup(setlocale(LC_MESSAGES, nullptr));
for (const auto &var_name : locale_variables) {
const auto var = vars.get(var_name, ENV_EXPORT);
std::string name = wcs2string(var_name);
if (var.missing_or_empty()) {
FLOGF(env_locale, L"locale var %s missing or empty", name.c_str());
unsetenv_lock(name.c_str());
} else {
const std::string value = wcs2string(var->as_string());
FLOGF(env_locale, L"locale var %s='%s'", name.c_str(), value.c_str());
setenv_lock(name.c_str(), value.c_str(), 1);
}
}
char *locale = setlocale(LC_ALL, "");
Try to set LC_CTYPE to something UTF-8 capable (#8031) * Try to set LC_CTYPE to something UTF-8 capable When fish is started with LC_CTYPE=C (even just effectively, often via LC_ALL=C!), it's basically broken. There's no way to handle non-ASCII characters with a C locale unless we want to write our locale-independent replacements for all of the system functions. Since we're not going to do that, let's try to find *some locale* for LC_CTYPE. We already do that in __fish_setlocale, but that's - a bit of a weird thing that reads unstandardized system configuration files - allows setting locale to C explicitly So it's still easily possible to end up in a broken configuration. Now, the issue with this is that there is (AFAICT) no portable way to get a list of all allowed locales and C.UTF-8 is not standardized, so we have no one locale to fall back on and are forced to try a few. The list we have here is quite arbitrary, but it's a start. Python does something similar and only tries C.UTF-8, C.utf8 and "UTF-8". Once C.UTF-8 is (hopefully) standardized, that will just start working (tm). Note that we do not *export* the fixed LC_CTYPE variable, so external programs still have to deal with the C locale, but we have no real business messing with the user's environment. To turn it off: $fish_allow_singlebyte_locale, if set to something true (like "1"), will re-run the locale initialization and skip the bit where we force LC_CTYPE to be utf8-capable. This is mainly used in our tests, but might also be useful if people are trying to do something weird.
2021-06-06 07:28:32 +00:00
// Try to get a multibyte-capable encoding
// A "C" locale is broken for our purposes - any wchar functions will break on it.
// So we try *really really really hard* to not have one.
bool fix_locale = true;
if (auto allow_c = vars.get(L"fish_allow_singlebyte_locale")) {
fix_locale = allow_c.missing_or_empty() ? true : !bool_from_string(allow_c->as_string());
}
if (fix_locale && MB_CUR_MAX == 1) {
FLOGF(env_locale, L"Have singlebyte locale, trying to fix");
for (auto loc : utf8_locales) {
setlocale(LC_CTYPE, loc);
if (MB_CUR_MAX > 1) {
FLOGF(env_locale, L"Fixed locale: '%s'", loc);
break;
}
}
if (MB_CUR_MAX == 1) {
FLOGF(env_locale, L"Failed to fix locale");
}
}
// We *always* use a C-locale for numbers,
// because we always want "." except for in printf.
setlocale(LC_NUMERIC, "C");
// See that we regenerate our special locale for numbers.
fish_invalidate_numeric_locale();
Try to set LC_CTYPE to something UTF-8 capable (#8031) * Try to set LC_CTYPE to something UTF-8 capable When fish is started with LC_CTYPE=C (even just effectively, often via LC_ALL=C!), it's basically broken. There's no way to handle non-ASCII characters with a C locale unless we want to write our locale-independent replacements for all of the system functions. Since we're not going to do that, let's try to find *some locale* for LC_CTYPE. We already do that in __fish_setlocale, but that's - a bit of a weird thing that reads unstandardized system configuration files - allows setting locale to C explicitly So it's still easily possible to end up in a broken configuration. Now, the issue with this is that there is (AFAICT) no portable way to get a list of all allowed locales and C.UTF-8 is not standardized, so we have no one locale to fall back on and are forced to try a few. The list we have here is quite arbitrary, but it's a start. Python does something similar and only tries C.UTF-8, C.utf8 and "UTF-8". Once C.UTF-8 is (hopefully) standardized, that will just start working (tm). Note that we do not *export* the fixed LC_CTYPE variable, so external programs still have to deal with the C locale, but we have no real business messing with the user's environment. To turn it off: $fish_allow_singlebyte_locale, if set to something true (like "1"), will re-run the locale initialization and skip the bit where we force LC_CTYPE to be utf8-capable. This is mainly used in our tests, but might also be useful if people are trying to do something weird.
2021-06-06 07:28:32 +00:00
fish_setlocale();
FLOGF(env_locale, L"init_locale() setlocale(): '%s'", locale);
const char *new_msg_locale = setlocale(LC_MESSAGES, nullptr);
FLOGF(env_locale, L"old LC_MESSAGES locale: '%s'", old_msg_locale);
FLOGF(env_locale, L"new LC_MESSAGES locale: '%s'", new_msg_locale);
#ifdef HAVE__NL_MSG_CAT_CNTR
if (std::strcmp(old_msg_locale, new_msg_locale) != 0) {
// Make change known to GNU gettext.
extern int _nl_msg_cat_cntr;
_nl_msg_cat_cntr++;
}
#endif
free(old_msg_locale);
}
/// Returns true if we think the terminal supports setting its title.
bool term_supports_setting_title() { return can_set_term_title; }
// Limit `read` to 100 MiB (bytes not wide chars) by default. This can be overridden by the
// fish_read_limit variable.
size_t read_byte_limit = 100 * 1024 * 1024;