fish-shell/src/exec.cpp


// Functions for executing a program.
//
// Some of the code in this file is based on code from the Glibc manual, though the changes
// performed have been massive.
#include "config.h"
#include <errno.h>
#include <fcntl.h>
#ifdef HAVE_SIGINFO_H
#include <siginfo.h>
#endif
#include <signal.h>
#ifdef HAVE_SPAWN_H
#include <spawn.h>
#endif
#include <paths.h>
#include <stdio.h>
#include <sys/wait.h>
#include <unistd.h>
#include <algorithm>
#include <cstring>
#include <functional>
#include <map>
#include <memory>
#include <stack>
#include <string>
#include <type_traits>
#include <vector>
#include "builtin.h"
#include "common.h"
#include "env.h"
#include "exec.h"
#include "fallback.h" // IWYU pragma: keep
#include "flog.h"
#include "function.h"
#include "io.h"
#include "iothread.h"
#include "job_group.h"
#include "null_terminated_array.h"
#include "parse_tree.h"
#include "parser.h"
#include "path.h"
#include "postfork.h"
#include "proc.h"
#include "reader.h"
#include "redirection.h"
#include "signal.h"
#include "timer.h"
#include "trace.h"
#include "wcstringutil.h"
#include "wutil.h" // IWYU pragma: keep
/// Number of calls to fork() or posix_spawn().
static relaxed_atomic_t<int> s_fork_count{0};
/// A launch_result_t indicates when a process failed to launch, and therefore the rest of the
/// pipeline should be aborted. This includes failed redirections, fd exhaustion, fork() failures,
/// etc.
enum class launch_result_t {
ok,
failed,
} __warn_unused_type;
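// Because of __warn_unused_type, callers must consume the result; a typical pattern
// (as in exec_process_in_job below) is:
//   if (exec_external_command(parser, j, p, io_chain) == launch_result_t::failed) {
//       return launch_result_t::failed;
//   }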
/// Given an error \p err returned from either posix_spawn or exec, \return a process exit code.
static int exit_code_from_exec_error(int err) {
assert(err && "Zero is success, not an error");
switch (err) {
case ENOENT:
case ENOTDIR:
// This indicates either the command was not found, or a file redirection was not found.
// We do not use posix_spawn file redirections so this is always command-not-found.
return STATUS_CMD_UNKNOWN;
case EACCES:
case ENOEXEC:
// The file is not executable for various reasons.
return STATUS_NOT_EXECUTABLE;
#ifdef EBADARCH
case EBADARCH:
// This is for e.g. running ARM app on Intel Mac.
return STATUS_NOT_EXECUTABLE;
#endif
default:
// Generic failure.
return EXIT_FAILURE;
}
}
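// Illustrative sketch of the mapping above (assuming the STATUS_* constants follow the
// conventional shell exit codes: 127 for "command not found", 126 for "not executable"):
//   execve("/no/such/cmd", ...) fails with ENOENT -> STATUS_CMD_UNKNOWN
//   execve("/etc/passwd", ...)  fails with EACCES -> STATUS_NOT_EXECUTABLE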
/// This is a 'looks like text' check.
/// \return true if either there is no NUL byte, or there is a line containing a lowercase letter
/// (or `$` or a backtick) before the first NUL byte.
static bool is_thompson_shell_payload(const char *p, size_t n) {
if (!memchr(p, '\0', n)) return true;
bool haslower = false;
for (; *p; p++) {
if (islower(*p) || *p == '$' || *p == '`') {
haslower = true;
}
if (haslower && *p == '\n') {
return true;
}
}
return false;
}
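// How the check behaves on some hypothetical inputs (not from the test suite):
//   "echo hello\n"                      -> true  (no NUL byte at all)
//   "exit\n" then '\0' and binary data  -> true  (a lowercase line precedes the first NUL)
//   "\x7fELF\x02\x01\x01\0..."          -> false (ELF magic: NUL before any lowercase line)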
/// This function checks the beginning of a file to see if it's safe to
/// pass to the system interpreter when execve() returns ENOEXEC.
///
/// The motivation is to be able to run classic shell scripts which
/// didn't have shebang, while protecting the user from accidentally
/// running a binary file which may corrupt terminal driver state. We
/// check for lowercase letters because the ASCII magic of binary files
/// is usually uppercase, e.g. PNG, JFIF, MZ, etc. These rules are also
/// flexible enough to permit scripts with concatenated binary content,
/// such as Actually Portable Executable.
/// N.B.: this is called after fork, it must not allocate heap memory.
bool is_thompson_shell_script(const char *path) {
// Paths ending in ".fish" are never considered Thompson shell scripts.
if (const char *lastdot = strrchr(path, '.')) {
if (0 == strcmp(lastdot, ".fish")) {
return false;
}
}
int e = errno;
bool res = false;
int fd = open_cloexec(path, O_RDONLY | O_NOCTTY);
if (fd != -1) {
char buf[256];
ssize_t got = read(fd, buf, sizeof(buf));
close(fd);
if (got >= 0 && is_thompson_shell_payload(buf, static_cast<size_t>(got))) {
res = true;
}
}
errno = e;
return res;
}
/// This function is executed by the child process created by a call to fork(). It should be called
/// after \c child_setup_process. It calls execve to replace the fish process image with the command
/// specified in \c p. It never returns. Called in a forked child! Do not allocate memory, etc.
[[noreturn]] static void safe_launch_process(process_t *p, const char *actual_cmd,
const char *const *cargv, const char *const *cenvv) {
UNUSED(p);
int err;
// This function never returns, so we take certain liberties with constness.
auto envv = const_cast<char **>(cenvv);
auto argv = const_cast<char **>(cargv);
auto cmd2 = const_cast<char *>(actual_cmd);
execve(actual_cmd, argv, envv);
err = errno;
// The shebang wasn't introduced until UNIX Seventh Edition, so if
// the kernel won't run the binary we hand it off to the interpreter
// after performing a binary safety check, recommended by POSIX: a
// line needs to exist before the first \0 with a lowercase letter
if (err == ENOEXEC && is_thompson_shell_script(actual_cmd)) {
// Construct new argv.
// We must not allocate memory, so only 128 args are supported.
constexpr size_t maxargs = 128;
size_t nargs = 0;
while (argv[nargs]) nargs++;
if (nargs <= maxargs) {
char *argv2[1 + maxargs + 1]; // +1 for /bin/sh, +1 for terminating nullptr
char interp[] = _PATH_BSHELL;
argv2[0] = interp;
std::copy_n(argv, 1 + nargs, &argv2[1]); // +1 to copy terminating nullptr
// The command to call should use the full path,
// not what we would pass as argv0.
argv2[1] = cmd2;
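// To illustrate with a hypothetical path: running `foo.sh a b` where foo.sh
// resolves to /tmp/foo.sh yields argv2 = {"/bin/sh", "/tmp/foo.sh", "a", "b",
// nullptr} (with "/bin/sh" standing in for whatever _PATH_BSHELL expands to).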
execve(_PATH_BSHELL, argv2, envv);
}
}
errno = err;
safe_report_exec_error(errno, actual_cmd, argv, envv);
exit_without_destructors(exit_code_from_exec_error(err));
}
/// This function is similar to safe_launch_process, except it is not called after a fork (i.e. it
/// only calls exec) and therefore it can allocate memory.
[[noreturn]] static void launch_process_nofork(env_stack_t &vars, process_t *p) {
ASSERT_IS_NOT_FORKED_CHILD();
// Construct argv. Ensure the strings stay alive for the duration of this function.
std::vector<std::string> narrow_strings = wide_string_list_to_narrow(p->argv());
null_terminated_array_t<char> narrow_argv(narrow_strings);
const char **argv = narrow_argv.get();
// Construct envp.
auto export_vars = vars.export_arr();
const char **envp = export_vars->get();
std::string actual_cmd = wcs2string(p->actual_cmd);
// Ensure the terminal modes are what they were before we changed them.
restore_term_mode();
// Bounce to safe_launch_process. This never returns.
safe_launch_process(p, actual_cmd.c_str(), argv, envp);
}
// Returns whether we can use posix spawn for a given process in a given job.
//
// To avoid the race between the caller calling tcsetpgrp() and the client checking the
// foreground process group, we don't use posix_spawn if we're going to foreground the process. (If
// we use fork(), we can call tcsetpgrp after the fork, before the exec, and avoid the race).
static bool can_use_posix_spawn_for_job(const std::shared_ptr<job_t> &job,
const dup2_list_t &dup2s) {
// Is it globally disabled?
if (!get_use_posix_spawn()) return false;
// Hack - do not use posix_spawn if there are self-fd redirections.
// For example if you were to write:
// cmd 6< /dev/null
// it is possible that the open() of /dev/null would result in fd 6. Here even if we attempted
// to add a dup2 action, it would be ignored and the CLOEXEC bit would remain. So don't use
// posix_spawn in this case; instead we'll call fork() and clear the CLOEXEC bit manually.
for (const auto &action : dup2s.get_actions()) {
if (action.src == action.target) return false;
}
if (job->group->wants_terminal()) {
// This job will be foregrounded, so we will call tcsetpgrp(), therefore do not use
// posix_spawn.
return false;
}
return true;
}
static void internal_exec(env_stack_t &vars, job_t *j, const io_chain_t &block_io) {
// Do a regular launch - but without forking first...
process_t *p = j->processes.front().get();
io_chain_t all_ios = block_io;
if (!all_ios.append_from_specs(p->redirection_specs(), vars.get_pwd_slash())) {
return;
}
// child_setup_process makes sure signals are properly set up.
dup2_list_t redirs = dup2_list_t::resolve_chain(all_ios);
if (child_setup_process(false /* not claim_tty */, *j, false /* not is_forked */, redirs) ==
0) {
// Decrement SHLVL as we're removing ourselves from the shell "stack".
if (is_interactive_session()) {
auto shlvl_var = vars.get(L"SHLVL", ENV_GLOBAL | ENV_EXPORT);
wcstring shlvl_str = L"0";
if (shlvl_var) {
long shlvl = fish_wcstol(shlvl_var->as_string().c_str());
if (!errno && shlvl > 0) {
shlvl_str = to_string(shlvl - 1);
}
}
vars.set_one(L"SHLVL", ENV_GLOBAL | ENV_EXPORT, std::move(shlvl_str));
}
// launch_process_nofork _never_ returns.
launch_process_nofork(vars, p);
}
}
/// Construct an internal process for the process p. In the background, write the data \p outdata to
/// stdout and \p errdata to stderr, respecting the io chain \p ios. For example if target_fd is 1
/// (stdout), and there is a dup2 3->1, then we need to write to fd 3. Then exit the internal
/// process.
static void run_internal_process(process_t *p, std::string &&outdata, std::string &&errdata,
const io_chain_t &ios) {
p->check_generations_before_launch();
// We want both the dup2s and the io_chain_ts to be kept alive by the background thread, because
// they may own an fd that we want to write to. Move them all to a shared_ptr. The strings as
// well (they may be long).
// Construct a little helper struct to make it simpler to move into our closure without copying.
struct write_fields_t {
int src_outfd{-1};
std::string outdata{};
int src_errfd{-1};
std::string errdata{};
io_chain_t ios{};
maybe_t<dup2_list_t> dup2s{};
std::shared_ptr<internal_proc_t> internal_proc{};
proc_status_t success_status{};
bool skip_out() const { return outdata.empty() || src_outfd < 0; }
bool skip_err() const { return errdata.empty() || src_errfd < 0; }
};
auto f = std::make_shared<write_fields_t>();
f->outdata = std::move(outdata);
f->errdata = std::move(errdata);
// Construct and assign the internal process to the real process.
p->internal_proc_ = std::make_shared<internal_proc_t>();
f->internal_proc = p->internal_proc_;
FLOGF(proc_internal_proc, L"Created internal proc %llu to write output for proc '%ls'",
p->internal_proc_->get_id(), p->argv0());
// Resolve the IO chain.
// Note it's important we do this even if we have no out or err data, because we may have been
// asked to truncate a file (e.g. `echo -n '' > /tmp/truncateme.txt`). The open() in the dup2
// list resolution will ensure this happens.
f->dup2s = dup2_list_t::resolve_chain(ios);
// Figure out which source fds to write to. If they are closed (unlikely) we just exit
// successfully.
f->src_outfd = f->dup2s->fd_for_target_fd(STDOUT_FILENO);
f->src_errfd = f->dup2s->fd_for_target_fd(STDERR_FILENO);
// If we have nothing to write we can elide the thread.
// TODO: support eliding output to /dev/null.
if (f->skip_out() && f->skip_err()) {
f->internal_proc->mark_exited(p->status);
return;
}
// Ensure that ios stays alive, it may own fds.
f->ios = ios;
// If our process is a builtin, it will have already set its status value. Make sure we
// propagate that if our I/O succeeds and don't read it on a background thread. TODO: have
// builtin_run provide this directly, rather than setting it in the process.
f->success_status = p->status;
iothread_perform_cantwait([f]() {
proc_status_t status = f->success_status;
if (!f->skip_out()) {
ssize_t ret = write_loop(f->src_outfd, f->outdata.data(), f->outdata.size());
if (ret < 0) {
if (errno != EPIPE) {
wperror(L"write");
}
if (status.is_success()) {
status = proc_status_t::from_exit_code(1);
}
}
}
if (!f->skip_err()) {
ssize_t ret = write_loop(f->src_errfd, f->errdata.data(), f->errdata.size());
if (ret < 0) {
if (errno != EPIPE) {
wperror(L"write");
}
if (status.is_success()) {
status = proc_status_t::from_exit_code(1);
}
}
}
f->internal_proc->mark_exited(status);
});
}
/// If \p outdata or \p errdata are both empty, then mark the process as completed immediately.
/// Otherwise, run an internal process.
static void run_internal_process_or_short_circuit(parser_t &parser, const std::shared_ptr<job_t> &j,
process_t *p, std::string &&outdata,
std::string &&errdata, const io_chain_t &ios) {
if (outdata.empty() && errdata.empty()) {
p->completed = true;
if (p->is_last_in_job) {
FLOGF(exec_job_status, L"Set status of job %d (%ls) to %d using short circuit",
j->job_id(), j->preview().c_str(), p->status);
auto statuses = j->get_statuses();
if (statuses) {
parser.set_last_statuses(statuses.value());
parser.libdata().status_count++;
} else if (j->flags().negate) {
// Special handling for `not set var (substitution)`.
// If there is no status, but negation was requested,
// take the last status and negate it.
auto last_statuses = parser.get_last_statuses();
last_statuses.status = !last_statuses.status;
parser.set_last_statuses(last_statuses);
}
}
} else {
run_internal_process(p, std::move(outdata), std::move(errdata), ios);
}
}
bool blocked_signals_for_job(const job_t &job, sigset_t *sigmask) {
// Block some signals in background jobs for which job control is turned off (#6828).
if (!job.is_foreground() && !job.wants_job_control()) {
sigaddset(sigmask, SIGINT);
sigaddset(sigmask, SIGQUIT);
return true;
}
return false;
}
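// A minimal usage sketch (the caller owns and initializes the mask; this function only
// ever adds signals to it):
//   sigset_t sigmask;
//   sigemptyset(&sigmask);
//   if (blocked_signals_for_job(*job, &sigmask)) {
//       // Apply sigmask to the child, e.g. via posix_spawnattr_setsigmask().
//   }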
/// Call fork() as part of executing a process \p p in a job \j. Execute \p child_action in the
/// context of the child.
static launch_result_t fork_child_for_process(const std::shared_ptr<job_t> &job, process_t *p,
const dup2_list_t &dup2s, const char *fork_type,
const std::function<void()> &child_action) {
// Claim the tty from fish, if the job wants it and we are the pgroup leader.
pid_t claim_tty_from =
(p->leads_pgrp && job->group->wants_terminal()) ? getpgrp() : INVALID_PID;
pid_t pid = execute_fork();
if (pid < 0) {
return launch_result_t::failed;
}
const bool is_parent = (pid > 0);
// Record the pgroup if this is the leader.
// Both parent and child attempt to send the process to its new group, to resolve the race.
p->pid = is_parent ? pid : getpid();
if (p->leads_pgrp) {
job->group->set_pgid(p->pid);
}
if (auto pgid = job->group->get_pgid()) {
if (int err = execute_setpgid(p->pid, *pgid, is_parent)) {
report_setpgid_error(err, is_parent, *pgid, job.get(), p);
}
}
if (!is_parent) {
// Child process.
child_setup_process(claim_tty_from, *job, true, dup2s);
child_action();
DIE("Child process returned control to fork_child lambda!");
}
++s_fork_count;
FLOGF(exec_fork, L"Fork #%d, pid %d: %s for '%ls'", int(s_fork_count), pid, fork_type,
p->argv0());
return launch_result_t::ok;
}
/// \return a newly allocated output stream for the given fd, which is typically stdout or stderr.
/// This inspects the io_chain and decides what sort of output stream to return.
/// If \p piped_output_needs_buffering is set and the output is going to a pipe, then writing to the
/// pipe synchronously risks deadlock (the other end may not be reading yet), so we must buffer it.
static std::shared_ptr<output_stream_t> create_output_stream_for_builtin(
int fd, const io_chain_t &io_chain, bool piped_output_needs_buffering) {
using std::make_shared;
const shared_ptr<const io_data_t> io = io_chain.io_for_fd(fd);
if (io == nullptr) {
// Common case of no redirections.
// Just write to the fd directly.
return make_shared<fd_output_stream_t>(fd);
}
switch (io->io_mode) {
case io_mode_t::bufferfill: {
// Our IO redirection is to an internal buffer, e.g. a command substitution.
// We will write directly to it.
std::shared_ptr<io_buffer_t> buffer =
std::static_pointer_cast<const io_bufferfill_t>(io)->buffer();
return make_shared<buffered_output_stream_t>(buffer);
}
case io_mode_t::close:
// Like 'echo foo >&-'
return make_shared<null_output_stream_t>();
case io_mode_t::file:
// Output is to a file which has been opened.
return make_shared<fd_output_stream_t>(io->source_fd);
case io_mode_t::pipe:
// Output is to a pipe. We may need to buffer.
if (piped_output_needs_buffering) {
return make_shared<string_output_stream_t>();
} else {
return make_shared<fd_output_stream_t>(io->source_fd);
}
case io_mode_t::fd:
// This is a case like 'echo foo >&5'
// It's uncommon and unclear what should happen.
return make_shared<string_output_stream_t>();
}
DIE("Unreachable");
}
/// Handle output from a builtin, by printing the contents of builtin_io_streams to the redirections
/// given in io_chain.
static void handle_builtin_output(parser_t &parser, const std::shared_ptr<job_t> &j, process_t *p,
const io_chain_t &io_chain, const output_stream_t &out,
const output_stream_t &err) {
assert(p->type == process_type_t::builtin && "Process is not a builtin");
// Figure out any data remaining to write. We may have none, in which case we can short-circuit.
std::string outbuff = wcs2string(out.contents());
std::string errbuff = wcs2string(err.contents());
// Some historical behavior.
if (!outbuff.empty()) fflush(stdout);
if (!errbuff.empty()) fflush(stderr);
// Construct and run our background process.
run_internal_process_or_short_circuit(parser, j, p, std::move(outbuff), std::move(errbuff),
io_chain);
}
/// Executes an external command.
/// An error return here indicates that the process failed to launch, and the rest of
/// the pipeline should be cancelled.
static launch_result_t exec_external_command(parser_t &parser, const std::shared_ptr<job_t> &j,
process_t *p, const io_chain_t &proc_io_chain) {
assert(p->type == process_type_t::external && "Process is not external");
// Get argv and envv before we fork.
const std::vector<std::string> narrow_argv = wide_string_list_to_narrow(p->argv());
null_terminated_array_t<char> argv_array(narrow_argv);
// Convert our IO chain to a dup2 sequence.
auto dup2s = dup2_list_t::resolve_chain(proc_io_chain);
// Ensure that stdin is blocking before we hand it off (see issue #176).
// Note this will also affect stdout and stderr if they refer to the same tty.
make_fd_blocking(STDIN_FILENO);
auto export_arr = parser.vars().export_arr();
const char *const *argv = argv_array.get();
const char *const *envv = export_arr->get();
std::string actual_cmd_str = wcs2string(p->actual_cmd);
const char *actual_cmd = actual_cmd_str.c_str();
const wchar_t *file = parser.libdata().current_filename;
#if FISH_USE_POSIX_SPAWN
// Prefer to use posix_spawn, since it's faster on some systems like OS X.
if (can_use_posix_spawn_for_job(j, dup2s)) {
++s_fork_count; // spawn counts as a fork+exec
posix_spawner_t spawner(j.get(), dup2s);
maybe_t<pid_t> pid = spawner.spawn(actual_cmd, const_cast<char *const *>(argv),
const_cast<char *const *>(envv));
if (int err = spawner.get_error()) {
safe_report_exec_error(err, actual_cmd, argv, envv);
p->status = proc_status_t::from_exit_code(exit_code_from_exec_error(err));
return launch_result_t::failed;
}
assert(pid.has_value() && *pid > 0 && "Should have either a valid pid, or an error");
// This usleep can be used to test for various race conditions
// (https://github.com/fish-shell/fish-shell/issues/360).
// usleep(10000);
FLOGF(exec_fork, L"Fork #%d, pid %d: spawn external command '%s' from '%ls'",
int(s_fork_count), *pid, actual_cmd, file ? file : L"<no file>");
// these are all things do_fork() takes care of normally (for forked processes):
p->pid = *pid;
if (p->leads_pgrp) {
j->group->set_pgid(p->pid);
// posix_spawn should in principle set the pgid before returning.
// In glibc, posix_spawn uses fork() and the pgid group is set on the child side;
// therefore the parent may not have seen it be set yet.
// Ensure it gets set. See #4715, also https://github.com/Microsoft/WSL/issues/2997.
execute_setpgid(p->pid, p->pid, true /* is parent */);
}
return launch_result_t::ok;
} else
#endif
{
return fork_child_for_process(j, p, dup2s, "external command",
[&] { safe_launch_process(p, actual_cmd, argv, envv); });
}
}
// Given that we are about to execute a function, push a function block and set up the
// variable environment.
static block_t *function_prepare_environment(parser_t &parser, wcstring_list_t argv,
const function_properties_t &props) {
// Extract the function name and remaining arguments.
wcstring func_name;
if (!argv.empty()) {
// Extract and remove the function name from argv.
func_name = std::move(*argv.begin());
argv.erase(argv.begin());
}
block_t *fb = parser.push_block(block_t::function_block(func_name, argv, props.shadow_scope));
auto &vars = parser.vars();
// Set up the environment for the function. There are three components of the environment:
// 1. named arguments
// 2. inherited variables
// 3. argv
size_t idx = 0;
for (const wcstring &named_arg : props.named_arguments) {
if (idx < argv.size()) {
vars.set_one(named_arg, ENV_LOCAL | ENV_USER, argv.at(idx));
} else {
vars.set_empty(named_arg, ENV_LOCAL | ENV_USER);
}
idx++;
}
for (const auto &kv : props.inherit_vars) {
vars.set(kv.first, ENV_LOCAL | ENV_USER, kv.second);
}
vars.set_argv(std::move(argv));
return fb;
}
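// For example (illustrative fish script, not from this file): given
//   function greet --argument-names who; echo hi $who; end
//   greet world extra
// the body runs with $who == world and $argv == [world, extra]: named arguments are
// bound from the leading argv entries, while the full remaining argv is still set.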
// Given that we are done executing a function, restore the environment.
static void function_restore_environment(parser_t &parser, const block_t *block) {
parser.pop_block(block);
// If we returned due to a return statement, then stop returning now.
parser.libdata().returning = false;
}
// The "performer" function of a block or function process.
// This accepts a place to execute as \p parser and then executes the result, returning a status.
// This is factored out in this funny way in preparation for concurrent execution.
using proc_performer_t = std::function<proc_status_t(parser_t &parser)>;
// \return a function which may be used to run the given process \p.
// May return an empty std::function in the rare case that the to-be-called fish function no longer
// exists. This is just a dumb artifact of the fact that we only capture the function's name, not its
// properties, when creating the job; thus a race could delete the function before we fetch its
// properties.
static proc_performer_t get_performer_for_process(process_t *p, job_t *job,
const io_chain_t &io_chain) {
assert((p->type == process_type_t::function || p->type == process_type_t::block_node) &&
"Unexpected process type");
// We want to capture the job group.
job_group_ref_t job_group = job->group;
if (p->type == process_type_t::block_node) {
const parsed_source_ref_t &source = p->block_node_source;
const ast::statement_t *node = p->internal_block_node;
assert(source && node && "Process is missing node info");
return [=](parser_t &parser) {
return parser.eval_node(source, *node, io_chain, job_group).status;
};
} else {
assert(p->type == process_type_t::function);
auto props = function_get_props(p->argv0());
if (!props) {
FLOGF(error, _(L"Unknown function '%ls'"), p->argv0());
return proc_performer_t{};
}
const wcstring_list_t &argv = p->argv();
return [=](parser_t &parser) {
// Pull out the job list from the function.
const ast::job_list_t &body = props->func_node->jobs;
const block_t *fb = function_prepare_environment(parser, argv, *props);
auto res = parser.eval_node(props->parsed_source, body, io_chain, job_group);
function_restore_environment(parser, fb);
// If the function did not execute anything, treat it as success.
if (res.was_empty) {
res = proc_status_t::from_exit_code(EXIT_SUCCESS);
}
return res.status;
};
}
}
/// Execute a block node or function "process".
/// \p piped_output_needs_buffering if true, buffer the output.
static launch_result_t exec_block_or_func_process(parser_t &parser, const std::shared_ptr<job_t> &j,
process_t *p, io_chain_t io_chain,
bool piped_output_needs_buffering) {
// Create an output buffer if we're piping to another process.
shared_ptr<io_bufferfill_t> block_output_bufferfill{};
if (piped_output_needs_buffering) {
// Be careful to handle failure, e.g. too many open fds.
block_output_bufferfill = io_bufferfill_t::create();
if (!block_output_bufferfill) {
return launch_result_t::failed;
}
// Teach the job about its bufferfill, and add it to our io chain.
io_chain.push_back(block_output_bufferfill);
}
// Get the process performer, and just execute it directly.
// Do it in this scoped way so that the performer function can be eagerly deallocated, releasing
// its captured io chain.
if (proc_performer_t performer = get_performer_for_process(p, j.get(), io_chain)) {
p->status = performer(parser);
} else {
return launch_result_t::failed;
}
// If we have a block output buffer, populate it now.
std::string buffer_contents;
if (block_output_bufferfill) {
// Remove our write pipe and forget it. This may close the pipe, unless another thread has
// claimed it (background write) or another process has inherited it.
io_chain.remove(block_output_bufferfill);
buffer_contents =
io_bufferfill_t::finish(std::move(block_output_bufferfill)).newline_serialized();
}
run_internal_process_or_short_circuit(parser, j, p, std::move(buffer_contents),
{} /* errdata */, io_chain);
return launch_result_t::ok;
}
static proc_performer_t get_performer_for_builtin(
process_t *p, job_t *job, const io_chain_t &io_chain,
const std::shared_ptr<output_stream_t> &output_stream,
const std::shared_ptr<output_stream_t> &errput_stream) {
assert(p->type == process_type_t::builtin && "Process must be a builtin");
// Determine if we have a "direct" redirection for stdin.
bool stdin_is_directly_redirected = false;
if (!p->is_first_in_job) {
// We must have a pipe
stdin_is_directly_redirected = true;
} else {
// We are not a pipe. Check if there is a redirection local to the process
// that's not io_mode_t::close.
for (const auto &redir : p->redirection_specs()) {
if (redir.fd == STDIN_FILENO && !redir.is_close()) {
stdin_is_directly_redirected = true;
break;
}
}
}
// Pull out some fields which we want to copy. We don't want to store the process or job in the
// returned closure.
job_group_ref_t job_group = job->group;
const wcstring_list_t &argv = p->argv();
// Be careful to not capture p or j by value, as the intent is that this may be run on another
// thread.
return [=](parser_t &parser) {
auto out_io = io_chain.io_for_fd(STDOUT_FILENO);
auto err_io = io_chain.io_for_fd(STDERR_FILENO);
// Figure out what fd to use for the builtin's stdin.
int local_builtin_stdin = STDIN_FILENO;
if (const auto in = io_chain.io_for_fd(STDIN_FILENO)) {
// Ignore fd redirections from an fd other than the
// standard ones. e.g. in source <&3 don't actually read from fd 3,
// which is internal to fish. We still respect this redirection in
// that we pass it on as a block IO to the code that source runs,
// and therefore this is not an error.
bool ignore_redirect = in->io_mode == io_mode_t::fd && in->source_fd >= 3;
if (!ignore_redirect) {
local_builtin_stdin = in->source_fd;
}
}
// Populate our io_streams_t. This is a bag of information for the builtin.
io_streams_t streams{*output_stream, *errput_stream};
streams.job_group = job_group;
streams.stdin_fd = local_builtin_stdin;
streams.stdin_is_directly_redirected = stdin_is_directly_redirected;
streams.out_is_redirected = out_io != nullptr;
streams.err_is_redirected = err_io != nullptr;
streams.out_is_piped = (out_io && out_io->io_mode == io_mode_t::pipe);
streams.err_is_piped = (err_io && err_io->io_mode == io_mode_t::pipe);
streams.io_chain = &io_chain;
// Execute the builtin.
return builtin_run(parser, argv, streams);
};
}
/// Executes a builtin "process".
static launch_result_t exec_builtin_process(parser_t &parser, const std::shared_ptr<job_t> &j,
process_t *p, const io_chain_t &io_chain,
bool piped_output_needs_buffering) {
assert(p->type == process_type_t::builtin && "Process is not a builtin");
std::shared_ptr<output_stream_t> out =
create_output_stream_for_builtin(STDOUT_FILENO, io_chain, piped_output_needs_buffering);
std::shared_ptr<output_stream_t> err =
create_output_stream_for_builtin(STDERR_FILENO, io_chain, piped_output_needs_buffering);
if (proc_performer_t performer = get_performer_for_builtin(p, j.get(), io_chain, out, err)) {
p->status = performer(parser);
} else {
return launch_result_t::failed;
}
handle_builtin_output(parser, j, p, io_chain, *out, *err);
return launch_result_t::ok;
}
/// Executes a process \p p in \p job, using the pipes \p pipes (which may have invalid fds if this
/// is the first or last process).
/// \p deferred_pipes represents the pipes from our deferred process; if set ensure they get closed
/// in any child. If \p is_deferred_run is true, then this is a deferred run; this affects how
/// certain buffering works.
/// An error return here indicates that the process failed to launch, and the rest of
/// the pipeline should be cancelled.
static launch_result_t exec_process_in_job(parser_t &parser, process_t *p,
const std::shared_ptr<job_t> &j,
const io_chain_t &block_io, autoclose_pipes_t pipes,
const autoclose_pipes_t &deferred_pipes,
bool is_deferred_run = false) {
// The write pipe (destined for stdout) needs to occur before redirections. For example,
// with a redirection like this:
//
// `foo 2>&1 | bar`
//
// what we want to happen is this:
//
// dup2(pipe, stdout)
// dup2(stdout, stderr)
//
// so that stdout and stderr both wind up referencing the pipe.
//
// The read pipe (destined for stdin) is more ambiguous. Imagine a pipeline like this:
//
// echo alpha | cat < beta.txt
//
// Should cat output alpha or beta? bash and ksh output 'beta', tcsh gets it right and
// complains about ambiguity, and zsh outputs both (!). No shells appear to output 'alpha',
// so we match bash here. That would mean putting the pipe first, so that it gets trumped by
// the file redirection.
//
// However, eval does this:
//
// echo "begin; $argv "\n" ;end <&3 3<&-" | source 3<&0
//
// which depends on the redirection being evaluated before the pipe. So the write end of the
// pipe comes first, the read pipe of the pipe comes last. See issue #966.
// Maybe trace this process.
// TODO: 'and' and 'or' will not show.
if (trace_enabled(parser)) {
trace_argv(parser, nullptr, p->argv());
}
// The IO chain for this process.
io_chain_t process_net_io_chain = block_io;
if (pipes.write.valid()) {
process_net_io_chain.push_back(std::make_shared<io_pipe_t>(
p->pipe_write_fd, false /* not input */, std::move(pipes.write)));
}
// Append IOs from the process's redirection specs.
// This may fail, e.g. a failed redirection.
if (!process_net_io_chain.append_from_specs(p->redirection_specs(),
parser.vars().get_pwd_slash())) {
return launch_result_t::failed;
}
// Read pipe goes last.
shared_ptr<io_pipe_t> pipe_read{};
if (pipes.read.valid()) {
pipe_read =
std::make_shared<io_pipe_t>(STDIN_FILENO, true /* input */, std::move(pipes.read));
process_net_io_chain.push_back(pipe_read);
}
// If we have stashed pipes, make sure those get closed in the child.
for (const autoclose_fd_t *afd : {&deferred_pipes.read, &deferred_pipes.write}) {
if (afd->valid()) {
process_net_io_chain.push_back(std::make_shared<io_close_t>(afd->fd()));
}
}
if (p->type != process_type_t::block_node) {
// A simple `begin ... end` should not be considered an execution of a command.
parser.libdata().exec_count++;
}
const block_t *block = nullptr;
cleanup_t pop_block([&]() {
if (block) parser.pop_block(block);
});
if (!p->variable_assignments.empty()) {
block = parser.push_block(block_t::variable_assignment_block());
}
for (const auto &assignment : p->variable_assignments) {
parser.vars().set(assignment.variable_name, ENV_LOCAL | ENV_EXPORT, assignment.values);
}
// Decide if outputting to a pipe may deadlock.
// This happens if fish pipes from an internal process into another internal process:
// echo $big | string match...
// Here fish will only run one process at a time, so the pipe buffer may overfill.
// It may also happen when piping internal -> external:
// echo $big | external_proc
// fish wants to run `echo` before launching external_proc, so the pipe may deadlock.
// However if we are a deferred run, it means that we are piping into an external process
// which got launched before us!
bool piped_output_needs_buffering = !p->is_last_in_job && !is_deferred_run;
// Execute the process.
p->check_generations_before_launch();
switch (p->type) {
case process_type_t::function:
case process_type_t::block_node: {
if (exec_block_or_func_process(parser, j, p, process_net_io_chain,
piped_output_needs_buffering) ==
launch_result_t::failed) {
return launch_result_t::failed;
}
break;
}
case process_type_t::builtin: {
if (exec_builtin_process(parser, j, p, process_net_io_chain,
piped_output_needs_buffering) == launch_result_t::failed) {
return launch_result_t::failed;
}
break;
}
case process_type_t::external: {
if (exec_external_command(parser, j, p, process_net_io_chain) ==
launch_result_t::failed) {
return launch_result_t::failed;
}
// It's possible (though unlikely) that this is a background process which recycled a
// pid from another, previous background process. Forget any such old process.
parser.get_wait_handles().remove_by_pid(p->pid);
break;
}
case process_type_t::exec: {
// We should have handled exec up above.
DIE("process_type_t::exec process found in pipeline, where it should never be. "
"Aborting.");
}
}
return launch_result_t::ok;
}
// Do we have a fish internal process that pipes into a real process? If so, we are going to
// launch it last (if there's more than one, just the last one). That is to prevent buffering
// from blocking further processes. See #1396.
// Example:
// for i in (seq 1 5); sleep 1; echo $i; end | cat
// This should show the output as it comes, not buffer until the end.
// Any such process (only one per job) will be called the "deferred" process.
static process_t *get_deferred_process(const shared_ptr<job_t> &j) {
// Common case is no deferred proc.
if (j->processes.size() <= 1) return nullptr;
// Skip execs, which can only appear at the front.
if (j->processes.front()->type == process_type_t::exec) return nullptr;
// Find the last non-external process, and return it if it pipes into an external process.
for (auto i = j->processes.rbegin(); i != j->processes.rend(); ++i) {
process_t *p = i->get();
if (p->type != process_type_t::external) {
return p->is_last_in_job ? nullptr : p;
}
}
return nullptr;
}
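// For example, in `seq 5 | string match 3 | cat` (assuming seq and cat resolve to
// external commands), the `string` builtin is the deferred process: scanning from the
// back, `cat` is skipped as external, and `string` is the last internal process and
// is not the last process in the job.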
/// Given that we failed to execute process \p failed_proc in job \p job, mark that process and
/// every subsequent process in the pipeline as aborted before launch.
static void abort_pipeline_from(const shared_ptr<job_t> &job, const process_t *failed_proc) {
bool found = false;
for (process_ptr_t &p : job->processes) {
found = found || (p.get() == failed_proc);
if (found) p->mark_aborted_before_launch();
}
assert(found && "Process not present in job");
}
// Given that we are about to execute an exec() call, check if the parser is interactive and there
// are extant background jobs. If so, warn the user and do not exec().
// \return true if we should allow exec, false to disallow it.
static bool allow_exec_with_background_jobs(parser_t &parser) {
// If we're not interactive, we cannot warn.
if (!parser.is_interactive()) return true;
// Construct the list of running background jobs.
job_list_t bgs = jobs_requiring_warning_on_exit(parser);
if (bgs.empty()) return true;
// Compare run counts, so we only warn once.
uint64_t current_run_count = reader_run_count();
uint64_t &last_exec_run_count = parser.libdata().last_exec_run_counter;
if (isatty(STDIN_FILENO) && current_run_count - 1 != last_exec_run_count) {
print_exit_warning_for_jobs(bgs);
last_exec_run_count = current_run_count;
return false;
} else {
hup_jobs(parser.jobs());
return true;
}
}
bool exec_job(parser_t &parser, const shared_ptr<job_t> &j, const io_chain_t &block_io) {
assert(j && "null job_t passed to exec_job!");
// If fish was invoked with -n or --no-execute, then no_exec will be set and we do nothing.
if (no_exec()) {
return true;
}
// Handle an exec call.
if (j->processes.front()->type == process_type_t::exec) {
// If we are interactive, perhaps disallow exec if there are background jobs.
if (!allow_exec_with_background_jobs(parser)) {
for (const auto &p : j->processes) {
p->mark_aborted_before_launch();
}
return false;
}
internal_exec(parser.vars(), j.get(), block_io);
// internal_exec only returns if it failed to set up redirections.
// In case of a successful exec, this code is not reached.
int status = j->flags().negate ? 0 : 1;
parser.set_last_statuses(statuses_t::just(status));
// A false return tells the caller to remove the job from the list.
for (const auto &p : j->processes) {
p->mark_aborted_before_launch();
}
return false;
}
cleanup_t timer = push_timer(j->wants_timing() && !no_exec());
// Get the deferred process, if any. We will have to remember its pipes.
autoclose_pipes_t deferred_pipes;
process_t *const deferred_process = get_deferred_process(j);
// We may want to transfer tty ownership to the pgroup leader.
tty_transfer_t transfer{};
// This loop loops over every process_t in the job, starting it as appropriate. This turns out
// to be rather complex, since a process_t can be one of many rather different things.
//
// The loop also has to handle pipelining between the jobs.
//
// We can have up to three pipes "in flight" at a time:
//
// 1. The pipe the current process should read from (courtesy of the previous process)
// 2. The pipe that the current process should write to
// 3. The pipe that the next process should read from (courtesy of us)
//
// Lastly, a process may experience a pipeline-aborting error, which prevents launching
// further processes in the pipeline.
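    // Concretely (hypothetical pipeline `a | b | c`, while launching `b`):
    //   1. proc_pipes.read holds the read end of the a->b pipe from the previous turn,
    //   2. proc_pipes.write holds the write end of a fresh b->c pipe,
    //   3. pipe_next_read keeps that fresh pipe's read end for c's iteration.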
autoclose_fd_t pipe_next_read;
bool aborted_pipeline = false;
size_t procs_launched = 0;
for (const auto &procptr : j->processes) {
process_t *p = procptr.get();
// proc_pipes is the pipes applied to this process. That is, it is the read end
// containing the output of the previous process (if any), plus the write end that will
// output to the next process (if any).
autoclose_pipes_t proc_pipes;
proc_pipes.read = std::move(pipe_next_read);
if (!p->is_last_in_job) {
auto pipes = make_autoclose_pipes();
if (!pipes) {
FLOGF(warning, PIPE_ERROR);
wperror(L"pipe");
aborted_pipeline = true;
abort_pipeline_from(j, p);
break;
}
pipe_next_read = std::move(pipes->read);
proc_pipes.write = std::move(pipes->write);
// Save any deferred process for last. By definition, the deferred process can never be
// the last process in the job, so it's safe to nest this in the outer
        // `if (!p->is_last_in_job)` block, which makes it clear that `pipe_next_read` will
// always be assigned when we `continue` the loop.
if (p == deferred_process) {
deferred_pipes = std::move(proc_pipes);
continue;
}
}
// Regular process.
if (exec_process_in_job(parser, p, j, block_io, std::move(proc_pipes), deferred_pipes) ==
launch_result_t::failed) {
aborted_pipeline = true;
abort_pipeline_from(j, p);
break;
}
procs_launched += 1;
// Transfer tty?
if (p->leads_pgrp && j->group->wants_terminal()) {
transfer.to_job_group(j->group);
}
}
pipe_next_read.close();
// If our pipeline was aborted before any process was successfully launched, then there is
// nothing to reap, and we can perform an early return.
// Note we must never return false if we have launched even one process, since it will not be
// properly reaped; see #7038.
if (aborted_pipeline && procs_launched == 0) {
return false;
}
// Ok, at least one thing got launched.
// Handle any deferred process.
if (deferred_process) {
if (aborted_pipeline) {
// Some other process already aborted our pipeline.
deferred_process->mark_aborted_before_launch();
} else if (exec_process_in_job(parser, deferred_process, j, block_io,
std::move(deferred_pipes), {},
true) == launch_result_t::failed) {
// The deferred proc itself failed to launch.
deferred_process->mark_aborted_before_launch();
}
}
FLOGF(exec_job_exec, L"Executed job %d from command '%ls'", j->job_id(), j->command_wcstr());
j->mark_constructed();
    // A backgrounded job exposes the pid of its last process as $last_pid. If the job has
    // no process with a pid (e.g. it contained only builtins), $last_pid is set to empty.
if (!j->is_foreground()) {
if (maybe_t<pid_t> last_pid = j->get_last_pid()) {
parser.vars().set_one(L"last_pid", ENV_GLOBAL, to_string(*last_pid));
} else {
parser.vars().set_empty(L"last_pid", ENV_GLOBAL);
}
}
if (!j->is_initially_background()) {
j->continue_job(parser);
}
if (j->is_stopped()) transfer.save_tty_modes();
transfer.reclaim();
return true;
}
/// Populate \p lst with the output of \p buffer, perhaps splitting lines according to \p split.
static void populate_subshell_output(wcstring_list_t *lst, const separated_buffer_t &buffer,
bool split) {
// Walk over all the elements.
for (const auto &elem : buffer.elements()) {
if (elem.is_explicitly_separated()) {
// Just append this one.
lst->push_back(str2wcstring(elem.contents));
continue;
}
        // Not explicitly separated. We may have to split it on newlines ourselves.
assert(!elem.is_explicitly_separated() && "should not be explicitly separated");
const char *begin = elem.contents.data();
const char *end = begin + elem.contents.size();
if (split) {
const char *cursor = begin;
while (cursor < end) {
// Look for the next separator.
auto stop = static_cast<const char *>(std::memchr(cursor, '\n', end - cursor));
const bool hit_separator = (stop != nullptr);
if (!hit_separator) {
// If it's not found, just use the end.
stop = end;
}
// Stop now points at the first character we do not want to copy.
lst->push_back(str2wcstring(cursor, stop - cursor));
// If we hit a separator, skip over it; otherwise we're at the end.
cursor = stop + (hit_separator ? 1 : 0);
}
} else {
// We're not splitting output, but we still want to trim off a trailing newline.
if (end != begin && end[-1] == '\n') {
--end;
}
lst->push_back(str2wcstring(begin, end - begin));
}
}
}
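// Example (hypothetical buffer contents): a single non-explicitly-separated element
// holding the bytes "foo\nbar\n" yields {"foo", "bar"} when split is true, and the
// single string "foo\nbar" (with the trailing newline trimmed) when split is false.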
/// Execute \p cmd in a subshell in \p parser. If \p lst is not null, populate it with the output.
/// Return $status in \p out_status.
/// If \p job_group is set, any spawned commands should join that job group.
/// If \p apply_exit_status is false, then reset $status back to its original value.
/// \p is_subcmd controls whether we apply a read limit.
/// \p break_expand is used to propagate whether the result should be "expansion breaking" in the
/// sense that subshells used during string expansion should halt that expansion. \return the value
/// of $status.
static int exec_subshell_internal(const wcstring &cmd, parser_t &parser,
const job_group_ref_t &job_group, wcstring_list_t *lst,
bool *break_expand, bool apply_exit_status, bool is_subcmd) {
parser.assert_can_execute();
auto &ld = parser.libdata();
scoped_push<bool> is_subshell(&ld.is_subshell, true);
scoped_push<size_t> read_limit(&ld.read_limit, is_subcmd ? read_byte_limit : 0);
auto prev_statuses = parser.get_last_statuses();
const cleanup_t put_back([&] {
if (!apply_exit_status) {
parser.set_last_statuses(prev_statuses);
}
});
const bool split_output = !parser.vars().get(L"IFS").missing_or_empty();
// IO buffer creation may fail (e.g. if we have too many open files to make a pipe), so this may
// be null.
auto bufferfill = io_bufferfill_t::create(ld.read_limit);
if (!bufferfill) {
*break_expand = true;
return STATUS_CMD_ERROR;
}
eval_res_t eval_res = parser.eval(cmd, io_chain_t{bufferfill}, job_group, block_type_t::subst);
separated_buffer_t buffer = io_bufferfill_t::finish(std::move(bufferfill));
if (buffer.discarded()) {
*break_expand = true;
return STATUS_READ_TOO_MUCH;
}
if (eval_res.break_expand) {
*break_expand = true;
return eval_res.status.status_value();
}
if (lst) {
populate_subshell_output(lst, buffer, split_output);
}
*break_expand = false;
return eval_res.status.status_value();
}
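// Example (illustrative): during command substitution (is_subcmd == true), output
// larger than the shell's read limit is discarded; exec_subshell_internal then sets
// *break_expand and returns STATUS_READ_TOO_MUCH, so the enclosing expansion is
// abandoned rather than silently truncated.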
int exec_subshell_for_expand(const wcstring &cmd, parser_t &parser,
const job_group_ref_t &job_group, wcstring_list_t &outputs) {
parser.assert_can_execute();
bool break_expand = false;
int ret = exec_subshell_internal(cmd, parser, job_group, &outputs, &break_expand, true, true);
// Only return an error code if we should break expansion.
return break_expand ? ret : STATUS_CMD_OK;
}
int exec_subshell(const wcstring &cmd, parser_t &parser, bool apply_exit_status) {
bool break_expand = false;
return exec_subshell_internal(cmd, parser, nullptr, nullptr, &break_expand, apply_exit_status,
false);
}
int exec_subshell(const wcstring &cmd, parser_t &parser, wcstring_list_t &outputs,
bool apply_exit_status) {
bool break_expand = false;
return exec_subshell_internal(cmd, parser, nullptr, &outputs, &break_expand, apply_exit_status,
false);
}
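// Usage sketch (hypothetical caller with a live parser):
//     wcstring_list_t outputs;
//     int status = exec_subshell(L"seq 3", parser, outputs, /*apply_exit_status=*/true);
//     // outputs now holds L"1", L"2", L"3", split on newlines,
//     // assuming $IFS is non-empty (the default).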