2023-03-16 22:49:46 +00:00
|
|
|
use super::delimited::{from_delimited_data, trim_from_str, DelimitedReaderConfig};
|
2021-11-09 20:17:37 +00:00
|
|
|
|
2022-04-25 17:54:14 +00:00
|
|
|
use nu_engine::CallExt;
|
2021-11-09 20:17:37 +00:00
|
|
|
use nu_protocol::ast::Call;
|
|
|
|
use nu_protocol::engine::{Command, EngineState, Stack};
|
2022-11-09 21:55:05 +00:00
|
|
|
use nu_protocol::{
|
|
|
|
Category, Example, PipelineData, ShellError, Signature, Span, SyntaxShape, Type, Value,
|
|
|
|
};
|
2021-11-09 20:17:37 +00:00
|
|
|
|
|
|
|
/// Unit struct for the `from tsv` command; it carries no state of its own.
#[derive(Clone)]
|
|
|
|
pub struct FromTsv;
|
|
|
|
|
|
|
|
impl Command for FromTsv {
|
|
|
|
fn name(&self) -> &str {
|
|
|
|
"from tsv"
|
|
|
|
}
|
|
|
|
|
|
|
|
fn signature(&self) -> Signature {
|
2021-12-31 15:54:30 +00:00
|
|
|
Signature::build("from tsv")
|
2022-11-09 21:55:05 +00:00
|
|
|
.input_output_types(vec![(Type::String, Type::Table(vec![]))])
|
2023-03-16 22:49:46 +00:00
|
|
|
.named(
|
|
|
|
"comment",
|
|
|
|
SyntaxShape::String,
|
|
|
|
"a comment character to ignore lines starting with it",
|
|
|
|
Some('c'),
|
|
|
|
)
|
|
|
|
.named(
|
|
|
|
"quote",
|
|
|
|
SyntaxShape::String,
|
|
|
|
"a quote character to ignore separators in strings, defaults to '\"'",
|
|
|
|
Some('q'),
|
|
|
|
)
|
|
|
|
.named(
|
|
|
|
"escape",
|
|
|
|
SyntaxShape::String,
|
|
|
|
"an escape character for strings containing the quote character",
|
|
|
|
Some('e'),
|
|
|
|
)
|
2021-11-17 04:22:37 +00:00
|
|
|
.switch(
|
|
|
|
"noheaders",
|
|
|
|
"don't treat the first row as column names",
|
|
|
|
Some('n'),
|
|
|
|
)
|
2023-03-16 22:49:46 +00:00
|
|
|
.switch(
|
|
|
|
"flexible",
|
|
|
|
"allow the number of fields in records to be variable",
|
|
|
|
None,
|
|
|
|
)
|
2022-05-07 20:04:31 +00:00
|
|
|
.switch("no-infer", "no field type inferencing", None)
|
2022-04-25 17:54:14 +00:00
|
|
|
.named(
|
|
|
|
"trim",
|
|
|
|
SyntaxShape::String,
|
|
|
|
"drop leading and trailing whitespaces around headers names and/or field values",
|
|
|
|
Some('t'),
|
|
|
|
)
|
2021-11-17 04:22:37 +00:00
|
|
|
.category(Category::Formats)
|
2021-11-09 20:17:37 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
fn usage(&self) -> &str {
|
2021-12-31 15:54:30 +00:00
|
|
|
"Parse text as .tsv and create table."
|
2021-11-09 20:17:37 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
fn run(
|
|
|
|
&self,
|
2022-04-18 22:28:01 +00:00
|
|
|
engine_state: &EngineState,
|
2022-04-25 17:54:14 +00:00
|
|
|
stack: &mut Stack,
|
2021-11-09 20:17:37 +00:00
|
|
|
call: &Call,
|
|
|
|
input: PipelineData,
|
2023-02-05 21:17:46 +00:00
|
|
|
) -> Result<PipelineData, ShellError> {
|
2022-04-25 17:54:14 +00:00
|
|
|
from_tsv(engine_state, stack, call, input)
|
2021-11-09 20:17:37 +00:00
|
|
|
}
|
2022-02-21 12:25:41 +00:00
|
|
|
|
|
|
|
fn examples(&self) -> Vec<Example> {
|
|
|
|
vec![
|
2022-11-09 21:55:05 +00:00
|
|
|
Example {
|
|
|
|
description: "Convert tab-separated data to a table",
|
|
|
|
example: "\"ColA\tColB\n1\t2\" | from tsv",
|
|
|
|
result: Some(Value::List {
|
|
|
|
vals: vec![Value::Record {
|
|
|
|
cols: vec!["ColA".to_string(), "ColB".to_string()],
|
|
|
|
vals: vec![
|
|
|
|
Value::test_int(1),
|
|
|
|
Value::test_int(2),
|
|
|
|
],
|
|
|
|
span: Span::test_data(),
|
|
|
|
}],
|
|
|
|
span: Span::test_data(),
|
|
|
|
})
|
|
|
|
},
|
2022-02-21 12:25:41 +00:00
|
|
|
Example {
|
|
|
|
description: "Create a tsv file with header columns and open it",
|
2022-10-26 16:36:42 +00:00
|
|
|
example: r#"$'c1(char tab)c2(char tab)c3(char nl)1(char tab)2(char tab)3' | save tsv-data | open tsv-data | from tsv"#,
|
2022-02-21 12:25:41 +00:00
|
|
|
result: None,
|
|
|
|
},
|
|
|
|
Example {
|
|
|
|
description: "Create a tsv file without header columns and open it",
|
2022-10-26 16:36:42 +00:00
|
|
|
example: r#"$'a1(char tab)b1(char tab)c1(char nl)a2(char tab)b2(char tab)c2' | save tsv-data | open tsv-data | from tsv -n"#,
|
2022-02-21 12:25:41 +00:00
|
|
|
result: None,
|
|
|
|
},
|
2022-04-25 17:54:14 +00:00
|
|
|
Example {
|
|
|
|
description: "Create a tsv file without header columns and open it, removing all unnecessary whitespaces",
|
2022-10-26 16:36:42 +00:00
|
|
|
example: r#"$'a1(char tab)b1(char tab)c1(char nl)a2(char tab)b2(char tab)c2' | save tsv-data | open tsv-data | from tsv --trim all"#,
|
2022-04-25 17:54:14 +00:00
|
|
|
result: None,
|
|
|
|
},
|
|
|
|
Example {
|
|
|
|
description: "Create a tsv file without header columns and open it, removing all unnecessary whitespaces in the header names",
|
2022-10-26 16:36:42 +00:00
|
|
|
example: r#"$'a1(char tab)b1(char tab)c1(char nl)a2(char tab)b2(char tab)c2' | save tsv-data | open tsv-data | from tsv --trim headers"#,
|
2022-04-25 17:54:14 +00:00
|
|
|
result: None,
|
|
|
|
},
|
|
|
|
Example {
|
|
|
|
description: "Create a tsv file without header columns and open it, removing all unnecessary whitespaces in the field values",
|
2022-10-26 16:36:42 +00:00
|
|
|
example: r#"$'a1(char tab)b1(char tab)c1(char nl)a2(char tab)b2(char tab)c2' | save tsv-data | open tsv-data | from tsv --trim fields"#,
|
2022-04-25 17:54:14 +00:00
|
|
|
result: None,
|
|
|
|
},
|
2022-02-21 12:25:41 +00:00
|
|
|
]
|
|
|
|
}
|
2021-11-09 20:17:37 +00:00
|
|
|
}
|
|
|
|
|
2022-04-25 17:54:14 +00:00
|
|
|
fn from_tsv(
|
|
|
|
engine_state: &EngineState,
|
|
|
|
stack: &mut Stack,
|
|
|
|
call: &Call,
|
|
|
|
input: PipelineData,
|
|
|
|
) -> Result<PipelineData, ShellError> {
|
2021-11-09 20:17:37 +00:00
|
|
|
let name = call.head;
|
|
|
|
|
2023-03-16 22:49:46 +00:00
|
|
|
let comment = call
|
|
|
|
.get_flag(engine_state, stack, "comment")?
|
|
|
|
.map(|v: Value| v.as_char())
|
|
|
|
.transpose()?;
|
|
|
|
let quote = call
|
|
|
|
.get_flag(engine_state, stack, "quote")?
|
|
|
|
.map(|v: Value| v.as_char())
|
|
|
|
.transpose()?
|
|
|
|
.unwrap_or('"');
|
|
|
|
let escape = call
|
|
|
|
.get_flag(engine_state, stack, "escape")?
|
|
|
|
.map(|v: Value| v.as_char())
|
|
|
|
.transpose()?;
|
2022-05-07 20:04:31 +00:00
|
|
|
let no_infer = call.has_flag("no-infer");
|
2021-11-09 20:17:37 +00:00
|
|
|
let noheaders = call.has_flag("noheaders");
|
2023-03-16 22:49:46 +00:00
|
|
|
let flexible = call.has_flag("flexible");
|
|
|
|
let trim = trim_from_str(call.get_flag(engine_state, stack, "trim")?)?;
|
|
|
|
|
|
|
|
let config = DelimitedReaderConfig {
|
|
|
|
separator: '\t',
|
|
|
|
comment,
|
|
|
|
quote,
|
|
|
|
escape,
|
|
|
|
noheaders,
|
|
|
|
flexible,
|
|
|
|
no_infer,
|
|
|
|
trim,
|
|
|
|
};
|
2021-11-09 20:17:37 +00:00
|
|
|
|
2023-03-16 22:49:46 +00:00
|
|
|
from_delimited_data(config, input, name)
|
2021-11-09 20:17:37 +00:00
|
|
|
}
|
|
|
|
|
|
|
|
#[cfg(test)]
mod test {
    use super::*;

    /// Runs the crate-level example checker against the `FromTsv` command.
    #[test]
    fn test_examples() {
        // Called by full path: a module-level `use crate::test_examples` would
        // clash with this function's own name.
        crate::test_examples(FromTsv)
    }
}
|