mirror of
https://github.com/nushell/nushell
synced 2024-12-31 23:39:00 +00:00
6c649809d3
This PR is a complete rewrite of `run_external.rs`. The main goal of the rewrite is improving readability, but it also fixes some bugs related to argument handling and the PATH variable (fixes https://github.com/nushell/nushell/issues/6011). I'll discuss some technical details to make reviewing easier. ## Argument handling Quoting arguments for external commands is hard. Like, *really* hard. We've had more than a dozen issues and PRs dedicated to quoting arguments (see Appendix) but the current implementation is still buggy. Here's a demonstration of the buggy behavior: ```nu let foo = "'bar'" ^touch $foo # This creates a file named `bar`, but it should be `'bar'` ^touch ...[ "'bar'" ] # Same ``` I'll describe how this PR deals with argument handling. First, we'll introduce the concept of **bare strings**. Bare strings are **string literals** that are either **unquoted** or **quoted by backticks** [^1]. Strings within a list literal are NOT considered bare strings, even if they are unquoted or quoted by backticks. When a bare string is used as an argument to external process, we need to perform tilde-expansion, glob-expansion, and inner-quotes-removal, in that order. "Inner-quotes-removal" means transforming from `--option="value"` into `--option=value`. ## `.bat` files and CMD built-ins On Windows, `.bat` files and `.cmd` files are considered executable, but they need `CMD.exe` as the interpreter. The Rust standard library supports running `.bat` files directly and will spawn `CMD.exe` under the hood (see [documentation](https://doc.rust-lang.org/std/process/index.html#windows-argument-splitting)). However, other extensions are not supported [^2]. Nushell also supports a selected number of CMD built-ins. The problem with CMD is that it uses a different set of quoting rules. Correctly quoting for CMD requires using [Command::raw_arg()](https://doc.rust-lang.org/std/os/windows/process/trait.CommandExt.html#tymethod.raw_arg) and manually quoting CMD special characters, on top of quoting from the Nushell side. ~~I decided that this is too complex and chose to reject special characters in CMD built-ins instead [^3]. Hopefully this will not affact real-world use cases.~~ I've implemented escaping that works reasonably well. ## `which-support` feature The `which` crate is now a hard dependency of `nu-command`, making the `which-support` feature essentially useless. The `which` crate is already a hard dependency of `nu-cli`, and we should consider removing the `which-support` feature entirely. ## Appendix Here's a list of quoting-related issues and PRs in rough chronological order. * https://github.com/nushell/nushell/issues/4609 * https://github.com/nushell/nushell/issues/4631 * https://github.com/nushell/nushell/issues/4601 * https://github.com/nushell/nushell/pull/5846 * https://github.com/nushell/nushell/issues/5978 * https://github.com/nushell/nushell/pull/6014 * https://github.com/nushell/nushell/issues/6154 * https://github.com/nushell/nushell/pull/6161 * https://github.com/nushell/nushell/issues/6399 * https://github.com/nushell/nushell/pull/6420 * https://github.com/nushell/nushell/pull/6426 * https://github.com/nushell/nushell/issues/6465 * https://github.com/nushell/nushell/issues/6559 * https://github.com/nushell/nushell/pull/6560 [^1]: The idea that backtick-quoted strings act like bare strings was introduced by Kubouch and briefly mentioned in [the language reference](https://www.nushell.sh/lang-guide/chapters/strings_and_text.html#backtick-quotes). [^2]: The documentation also said "running .bat scripts in this way may be removed in the future and so should not be relied upon", which is another reason to move away from this. But again, quoting for CMD is hard. [^3]: If anyone wants to try, the best resource I found on the topic is [this](https://daviddeley.com/autohotkey/parameters/parameters.htm).
199 lines
5 KiB
Rust
199 lines
5 KiB
Rust
use crate::repl::tests::{fail_test, run_test, TestResult};
|
|
use nu_test_support::nu;
|
|
|
|
#[test]
|
|
fn spread_in_list() -> TestResult {
|
|
run_test(r#"[...[]] | to nuon"#, "[]").unwrap();
|
|
run_test(
|
|
r#"[1 2 ...[[3] {x: 1}] 5] | to nuon"#,
|
|
"[1, 2, [3], {x: 1}, 5]",
|
|
)
|
|
.unwrap();
|
|
run_test(
|
|
r#"[...("foo" | split chars) 10] | to nuon"#,
|
|
"[f, o, o, 10]",
|
|
)
|
|
.unwrap();
|
|
run_test(
|
|
r#"let l = [1, 2, [3]]; [...$l $l] | to nuon"#,
|
|
"[1, 2, [3], [1, 2, [3]]]",
|
|
)
|
|
.unwrap();
|
|
run_test(
|
|
r#"[ ...[ ...[ ...[ a ] b ] c ] d ] | to nuon"#,
|
|
"[a, b, c, d]",
|
|
)
|
|
}
|
|
|
|
#[test]
|
|
fn not_spread() -> TestResult {
|
|
run_test(r#"def ... [x] { $x }; ... ..."#, "...").unwrap();
|
|
run_test(
|
|
r#"let a = 4; [... $a ... [1] ... (5) ...bare ...] | to nuon"#,
|
|
"[..., 4, ..., [1], ..., 5, ...bare, ...]",
|
|
)
|
|
}
|
|
|
|
#[test]
|
|
fn bad_spread_on_non_list() -> TestResult {
|
|
fail_test(r#"let x = 5; [...$x]"#, "cannot spread").unwrap();
|
|
fail_test(r#"[...({ x: 1 })]"#, "cannot spread")
|
|
}
|
|
|
|
#[test]
|
|
fn spread_type_list() -> TestResult {
|
|
run_test(
|
|
r#"def f [a: list<int>] { $a | describe }; f [1 ...[]]"#,
|
|
"list<int>",
|
|
)
|
|
.unwrap();
|
|
run_test(
|
|
r#"def f [a: list<int>] { $a | describe }; f [1 ...[2]]"#,
|
|
"list<int>",
|
|
)
|
|
.unwrap();
|
|
fail_test(
|
|
r#"def f [a: list<int>] { }; f ["foo" ...[4 5 6]]"#,
|
|
"expected int",
|
|
)
|
|
.unwrap();
|
|
fail_test(
|
|
r#"def f [a: list<int>] { }; f [1 2 ...["misfit"] 4]"#,
|
|
"expected int",
|
|
)
|
|
}
|
|
|
|
#[test]
|
|
fn spread_in_record() -> TestResult {
|
|
run_test(r#"{...{...{...{}}}} | to nuon"#, "{}").unwrap();
|
|
run_test(
|
|
r#"{foo: bar ...{a: {x: 1}} b: 3} | to nuon"#,
|
|
"{foo: bar, a: {x: 1}, b: 3}",
|
|
)
|
|
}
|
|
|
|
#[test]
|
|
fn duplicate_cols() -> TestResult {
|
|
fail_test(r#"{a: 1, ...{a: 3}}"#, "column used twice").unwrap();
|
|
fail_test(r#"{...{a: 4, x: 3}, x: 1}"#, "column used twice").unwrap();
|
|
fail_test(r#"{...{a: 0, x: 2}, ...{x: 5}}"#, "column used twice")
|
|
}
|
|
|
|
#[test]
|
|
fn bad_spread_on_non_record() -> TestResult {
|
|
fail_test(r#"let x = 5; { ...$x }"#, "cannot spread").unwrap();
|
|
fail_test(r#"{...([1, 2])}"#, "cannot spread")
|
|
}
|
|
|
|
#[test]
|
|
fn spread_type_record() -> TestResult {
|
|
run_test(
|
|
r#"def f [a: record<x: int>] { $a.x }; f { ...{x: 0} }"#,
|
|
"0",
|
|
)
|
|
.unwrap();
|
|
fail_test(
|
|
r#"def f [a: record<x: int>] {}; f { ...{x: "not an int"} }"#,
|
|
"type_mismatch",
|
|
)
|
|
}
|
|
|
|
#[test]
|
|
fn spread_external_args() {
|
|
assert_eq!(
|
|
nu!(r#"nu --testbin cococo ...[1 "foo"] 2 ...[3 "bar"]"#).out,
|
|
"1 foo 2 3 bar",
|
|
);
|
|
// exec doesn't have rest parameters but allows unknown arguments
|
|
assert_eq!(
|
|
nu!(r#"exec nu --testbin cococo "foo" ...[5 6]"#).out,
|
|
"foo 5 6"
|
|
);
|
|
}
|
|
|
|
#[test]
|
|
fn spread_internal_args() -> TestResult {
|
|
run_test(
|
|
r#"
|
|
let list = ["foo" 4]
|
|
def f [a b c? d? ...x] { [$a $b $c $d $x] | to nuon }
|
|
f 1 2 ...[5 6] 7 ...$list"#,
|
|
"[1, 2, null, null, [5, 6, 7, foo, 4]]",
|
|
)
|
|
.unwrap();
|
|
run_test(
|
|
r#"
|
|
def f [a b c? d? ...x] { [$a $b $c $d $x] | to nuon }
|
|
f 1 2 3 ...[5 6]"#,
|
|
"[1, 2, 3, null, [5, 6]]",
|
|
)
|
|
.unwrap();
|
|
run_test(
|
|
r#"
|
|
def f [--flag: int ...x] { [$flag $x] | to nuon }
|
|
f 2 ...[foo] 4 --flag 5 6 ...[7 8]"#,
|
|
"[5, [2, foo, 4, 6, 7, 8]]",
|
|
)
|
|
.unwrap();
|
|
run_test(
|
|
r#"
|
|
def f [a b? --flag: int ...x] { [$a $b $flag $x] | to nuon }
|
|
f 1 ...[foo] 4 --flag 5 6 ...[7 8]"#,
|
|
"[1, null, 5, [foo, 4, 6, 7, 8]]",
|
|
)
|
|
}
|
|
|
|
#[test]
|
|
fn bad_spread_internal_args() -> TestResult {
|
|
fail_test(
|
|
r#"
|
|
def f [a b c? d? ...x] { echo $a $b $c $d $x }
|
|
f 1 ...[5 6]"#,
|
|
"Missing required positional argument",
|
|
)
|
|
.unwrap();
|
|
fail_test(
|
|
r#"
|
|
def f [a b?] { echo a b c d }
|
|
f ...[5 6]"#,
|
|
"unexpected spread argument",
|
|
)
|
|
}
|
|
|
|
#[test]
|
|
fn spread_non_list_args() {
|
|
fail_test(r#"echo ...(1)"#, "cannot spread value").unwrap();
|
|
assert!(nu!(r#"nu --testbin cococo ...(1)"#)
|
|
.err
|
|
.contains("cannot spread value"));
|
|
}
|
|
|
|
#[test]
|
|
fn spread_args_type() -> TestResult {
|
|
fail_test(r#"def f [...x: int] {}; f ...["abc"]"#, "expected int")
|
|
}
|
|
|
|
#[test]
|
|
fn explain_spread_args() -> TestResult {
|
|
run_test(
|
|
r#"(explain { || echo ...[1 2] }).cmd_args.0 | select arg_type name type | to nuon"#,
|
|
r#"[[arg_type, name, type]; [spread, "[1 2]", list<int>]]"#,
|
|
)
|
|
}
|
|
|
|
#[test]
|
|
fn disallow_implicit_spread_for_externals() -> TestResult {
|
|
fail_test(r#"^echo [1 2]"#, "Lists are not automatically spread")
|
|
}
|
|
|
|
#[test]
|
|
fn respect_shape() -> TestResult {
|
|
fail_test(
|
|
"def foo [...rest] { ...$rest }; foo bar baz",
|
|
"Command `...$rest` not found",
|
|
)
|
|
.unwrap();
|
|
fail_test("module foo { ...$bar }", "expected_keyword").unwrap();
|
|
run_test(r#"def "...$foo" [] {2}; do { ...$foo }"#, "2").unwrap();
|
|
run_test(r#"match "...$foo" { ...$foo => 5 }"#, "5")
|
|
}
|