mirror of
https://github.com/nushell/nushell
synced 2025-01-26 11:55:20 +00:00
A more involved solution to the issue pointed out [here](https://github.com/nushell/nushell/pull/14337#issuecomment-2480392373) # Description With `--to-table` - cell-path groupers are used to create column names, similar to `select` - closure groupers result in columns named `closure_{i}` where `i` is the index of argument, with regards to other closures i.e. first closure grouper results in a column named `closure_0` Previously - `group-by foo {...} {...}` => `table<foo, group1, group2, items>` - `group-by {...} foo {...}` => `table<group0, foo, group2, items>` With this PR - `group-by foo {...} {...}` => `table<foo, closure_0, closure_1, items>` - `group-by {...} foo {...}` => `table<closure_0, foo, closure_1, items>` - no grouper argument results in a `table<group, items>` as previously On naming conflicts caused by cell-path groupers named `items` or `closure_{i}`, an error is thrown, suggesting to use a closure in place of a cell-path. ```nushell ❯ ls | rename items | group-by items --to-table Error: × grouper arguments can't be named `items` ╭─[entry #3:1:29] 1 │ ls | rename items | group-by items --to-table · ────────┬──────── · ╰── contains `items` ╰──── help: instead of a cell-path, try using a closure ``` And following the suggestion: ```nushell ❯ ls | rename items | group-by { get items } --to-table ╭─#──┬──────closure_0──────┬───────────────────────────items────────────────────────────╮ │ 0 │ CITATION.cff │ ╭─#─┬────items─────┬─type─┬─size──┬───modified───╮ │ │ │ │ │ 0 │ CITATION.cff │ file │ 812 B │ 3 months ago │ │ │ │ │ ╰─#─┴────items─────┴─type─┴─size──┴───modified───╯ │ │ 1 │ CODE_OF_CONDUCT.md │ ╭─#─┬───────items────────┬─type─┬──size───┬───modified───╮ │ ... ```
This commit is contained in:
parent
6c36bd822c
commit
e5cec8f4eb
1 changed files with 116 additions and 51 deletions
|
@ -1,6 +1,6 @@
|
||||||
use indexmap::IndexMap;
|
use indexmap::IndexMap;
|
||||||
use nu_engine::{command_prelude::*, ClosureEval};
|
use nu_engine::{command_prelude::*, ClosureEval};
|
||||||
use nu_protocol::{engine::Closure, IntoValue};
|
use nu_protocol::{engine::Closure, FromValue, IntoValue};
|
||||||
|
|
||||||
#[derive(Clone)]
|
#[derive(Clone)]
|
||||||
pub struct GroupBy;
|
pub struct GroupBy;
|
||||||
|
@ -12,10 +12,6 @@ impl Command for GroupBy {
|
||||||
|
|
||||||
fn signature(&self) -> Signature {
|
fn signature(&self) -> Signature {
|
||||||
Signature::build("group-by")
|
Signature::build("group-by")
|
||||||
// TODO: It accepts Table also, but currently there is no Table
|
|
||||||
// example. Perhaps Table should be a subtype of List, in which case
|
|
||||||
// the current signature would suffice even when a Table example
|
|
||||||
// exists.
|
|
||||||
.input_output_types(vec![(Type::List(Box::new(Type::Any)), Type::Any)])
|
.input_output_types(vec![(Type::List(Box::new(Type::Any)), Type::Any)])
|
||||||
.switch(
|
.switch(
|
||||||
"to-table",
|
"to-table",
|
||||||
|
@ -229,7 +225,7 @@ pub fn group_by(
|
||||||
input: PipelineData,
|
input: PipelineData,
|
||||||
) -> Result<PipelineData, ShellError> {
|
) -> Result<PipelineData, ShellError> {
|
||||||
let head = call.head;
|
let head = call.head;
|
||||||
let groupers: Vec<Value> = call.rest(engine_state, stack, 0)?;
|
let groupers: Vec<Spanned<Grouper>> = call.rest(engine_state, stack, 0)?;
|
||||||
let to_table = call.has_flag(engine_state, stack, "to-table")?;
|
let to_table = call.has_flag(engine_state, stack, "to-table")?;
|
||||||
let config = engine_state.get_config();
|
let config = engine_state.get_config();
|
||||||
|
|
||||||
|
@ -238,20 +234,20 @@ pub fn group_by(
|
||||||
return Ok(Value::record(Record::new(), head).into_pipeline_data());
|
return Ok(Value::record(Record::new(), head).into_pipeline_data());
|
||||||
}
|
}
|
||||||
|
|
||||||
let mut groupers = groupers.into_iter();
|
let grouped = match &groupers[..] {
|
||||||
|
[first, rest @ ..] => {
|
||||||
let grouped = if let Some(grouper) = groupers.next() {
|
let mut grouped = Grouped::new(first.as_ref(), values, config, engine_state, stack)?;
|
||||||
let mut groups = Grouped::new(&grouper, values, config, engine_state, stack)?;
|
for grouper in rest {
|
||||||
for grouper in groupers {
|
grouped.subgroup(grouper.as_ref(), config, engine_state, stack)?;
|
||||||
groups.subgroup(&grouper, config, engine_state, stack)?;
|
}
|
||||||
|
grouped
|
||||||
}
|
}
|
||||||
groups
|
[] => Grouped::empty(values, config),
|
||||||
} else {
|
|
||||||
Grouped::empty(values, config)
|
|
||||||
};
|
};
|
||||||
|
|
||||||
let value = if to_table {
|
let value = if to_table {
|
||||||
grouped.into_table(head)
|
let column_names = groupers_to_column_names(&groupers)?;
|
||||||
|
grouped.into_table(&column_names, head)
|
||||||
} else {
|
} else {
|
||||||
grouped.into_record(head)
|
grouped.into_record(head)
|
||||||
};
|
};
|
||||||
|
@ -259,8 +255,67 @@ pub fn group_by(
|
||||||
Ok(value.into_pipeline_data())
|
Ok(value.into_pipeline_data())
|
||||||
}
|
}
|
||||||
|
|
||||||
|
fn groupers_to_column_names(groupers: &[Spanned<Grouper>]) -> Result<Vec<String>, ShellError> {
|
||||||
|
if groupers.is_empty() {
|
||||||
|
return Ok(vec!["group".into(), "items".into()]);
|
||||||
|
}
|
||||||
|
|
||||||
|
let mut closure_idx: usize = 0;
|
||||||
|
let grouper_names = groupers.iter().map(|grouper| {
|
||||||
|
grouper.as_ref().map(|item| match item {
|
||||||
|
Grouper::CellPath { val } => val.to_column_name(),
|
||||||
|
Grouper::Closure { .. } => {
|
||||||
|
closure_idx += 1;
|
||||||
|
format!("closure_{}", closure_idx - 1)
|
||||||
|
}
|
||||||
|
})
|
||||||
|
});
|
||||||
|
|
||||||
|
let mut name_set: Vec<Spanned<String>> = Vec::with_capacity(grouper_names.len());
|
||||||
|
|
||||||
|
for name in grouper_names {
|
||||||
|
if name.item == "items" {
|
||||||
|
return Err(ShellError::GenericError {
|
||||||
|
error: "grouper arguments can't be named `items`".into(),
|
||||||
|
msg: "here".into(),
|
||||||
|
span: Some(name.span),
|
||||||
|
help: Some("instead of a cell-path, try using a closure: { get items }".into()),
|
||||||
|
inner: vec![],
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
if let Some(conflicting_name) = name_set
|
||||||
|
.iter()
|
||||||
|
.find(|elem| elem.as_ref().item == name.item.as_str())
|
||||||
|
{
|
||||||
|
return Err(ShellError::GenericError {
|
||||||
|
error: "grouper arguments result in colliding column names".into(),
|
||||||
|
msg: "duplicate column names".into(),
|
||||||
|
span: Some(conflicting_name.span.append(name.span)),
|
||||||
|
help: Some(
|
||||||
|
"instead of a cell-path, try using a closure or renaming columns".into(),
|
||||||
|
),
|
||||||
|
inner: vec![ShellError::ColumnDefinedTwice {
|
||||||
|
col_name: conflicting_name.item.clone(),
|
||||||
|
first_use: conflicting_name.span,
|
||||||
|
second_use: name.span,
|
||||||
|
}],
|
||||||
|
});
|
||||||
|
}
|
||||||
|
|
||||||
|
name_set.push(name);
|
||||||
|
}
|
||||||
|
|
||||||
|
let column_names: Vec<String> = name_set
|
||||||
|
.into_iter()
|
||||||
|
.map(|elem| elem.item)
|
||||||
|
.chain(["items".into()])
|
||||||
|
.collect();
|
||||||
|
Ok(column_names)
|
||||||
|
}
|
||||||
|
|
||||||
fn group_cell_path(
|
fn group_cell_path(
|
||||||
column_name: CellPath,
|
column_name: &CellPath,
|
||||||
values: Vec<Value>,
|
values: Vec<Value>,
|
||||||
config: &nu_protocol::Config,
|
config: &nu_protocol::Config,
|
||||||
) -> Result<IndexMap<String, Vec<Value>>, ShellError> {
|
) -> Result<IndexMap<String, Vec<Value>>, ShellError> {
|
||||||
|
@ -305,8 +360,25 @@ fn group_closure(
|
||||||
Ok(groups)
|
Ok(groups)
|
||||||
}
|
}
|
||||||
|
|
||||||
|
enum Grouper {
|
||||||
|
CellPath { val: CellPath },
|
||||||
|
Closure { val: Box<Closure> },
|
||||||
|
}
|
||||||
|
|
||||||
|
impl FromValue for Grouper {
|
||||||
|
fn from_value(v: Value) -> Result<Self, ShellError> {
|
||||||
|
match v {
|
||||||
|
Value::CellPath { val, .. } => Ok(Grouper::CellPath { val }),
|
||||||
|
Value::Closure { val, .. } => Ok(Grouper::Closure { val }),
|
||||||
|
_ => Err(ShellError::TypeMismatch {
|
||||||
|
err_message: "unsupported grouper type".to_string(),
|
||||||
|
span: v.span(),
|
||||||
|
}),
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
struct Grouped {
|
struct Grouped {
|
||||||
grouper: Option<String>,
|
|
||||||
groups: Tree,
|
groups: Tree,
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -325,41 +397,35 @@ impl Grouped {
|
||||||
}
|
}
|
||||||
|
|
||||||
Self {
|
Self {
|
||||||
grouper: Some("group".into()),
|
|
||||||
groups: Tree::Leaf(groups),
|
groups: Tree::Leaf(groups),
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
fn new(
|
fn new(
|
||||||
grouper: &Value,
|
grouper: Spanned<&Grouper>,
|
||||||
values: Vec<Value>,
|
values: Vec<Value>,
|
||||||
config: &nu_protocol::Config,
|
config: &nu_protocol::Config,
|
||||||
engine_state: &EngineState,
|
engine_state: &EngineState,
|
||||||
stack: &mut Stack,
|
stack: &mut Stack,
|
||||||
) -> Result<Self, ShellError> {
|
) -> Result<Self, ShellError> {
|
||||||
let span = grouper.span();
|
let groups = match grouper.item {
|
||||||
let groups = match grouper {
|
Grouper::CellPath { val } => group_cell_path(val, values, config)?,
|
||||||
Value::CellPath { val, .. } => group_cell_path(val.clone(), values, config)?,
|
Grouper::Closure { val } => group_closure(
|
||||||
Value::Closure { val, .. } => {
|
values,
|
||||||
group_closure(values, span, Closure::clone(val), engine_state, stack)?
|
grouper.span,
|
||||||
}
|
Closure::clone(val),
|
||||||
_ => {
|
engine_state,
|
||||||
return Err(ShellError::TypeMismatch {
|
stack,
|
||||||
err_message: "unsupported grouper type".to_string(),
|
)?,
|
||||||
span,
|
|
||||||
})
|
|
||||||
}
|
|
||||||
};
|
};
|
||||||
let grouper = grouper.as_cell_path().ok().map(CellPath::to_column_name);
|
|
||||||
Ok(Self {
|
Ok(Self {
|
||||||
grouper,
|
|
||||||
groups: Tree::Leaf(groups),
|
groups: Tree::Leaf(groups),
|
||||||
})
|
})
|
||||||
}
|
}
|
||||||
|
|
||||||
fn subgroup(
|
fn subgroup(
|
||||||
&mut self,
|
&mut self,
|
||||||
grouper: &Value,
|
grouper: Spanned<&Grouper>,
|
||||||
config: &nu_protocol::Config,
|
config: &nu_protocol::Config,
|
||||||
engine_state: &EngineState,
|
engine_state: &EngineState,
|
||||||
stack: &mut Stack,
|
stack: &mut Stack,
|
||||||
|
@ -384,34 +450,33 @@ impl Grouped {
|
||||||
Ok(())
|
Ok(())
|
||||||
}
|
}
|
||||||
|
|
||||||
fn into_table(self, head: Span) -> Value {
|
fn into_table(self, column_names: &[String], head: Span) -> Value {
|
||||||
self._into_table(head, 0)
|
self._into_table(head)
|
||||||
.into_iter()
|
.into_iter()
|
||||||
.map(|row| row.into_iter().rev().collect::<Record>().into_value(head))
|
.map(|row| {
|
||||||
|
row.into_iter()
|
||||||
|
.rev()
|
||||||
|
.zip(column_names)
|
||||||
|
.map(|(val, key)| (key.clone(), val))
|
||||||
|
.collect::<Record>()
|
||||||
|
.into_value(head)
|
||||||
|
})
|
||||||
.collect::<Vec<_>>()
|
.collect::<Vec<_>>()
|
||||||
.into_value(head)
|
.into_value(head)
|
||||||
}
|
}
|
||||||
|
|
||||||
fn _into_table(self, head: Span, index: usize) -> Vec<Record> {
|
fn _into_table(self, head: Span) -> Vec<Vec<Value>> {
|
||||||
let grouper = self.grouper.unwrap_or_else(|| format!("group{index}"));
|
|
||||||
match self.groups {
|
match self.groups {
|
||||||
Tree::Leaf(leaf) => leaf
|
Tree::Leaf(leaf) => leaf
|
||||||
.into_iter()
|
.into_iter()
|
||||||
.map(|(group, values)| {
|
.map(|(group, values)| vec![(values.into_value(head)), (group.into_value(head))])
|
||||||
[
|
.collect::<Vec<Vec<Value>>>(),
|
||||||
("items".to_string(), values.into_value(head)),
|
|
||||||
(grouper.clone(), group.into_value(head)),
|
|
||||||
]
|
|
||||||
.into_iter()
|
|
||||||
.collect()
|
|
||||||
})
|
|
||||||
.collect::<Vec<Record>>(),
|
|
||||||
Tree::Branch(branch) => branch
|
Tree::Branch(branch) => branch
|
||||||
.into_iter()
|
.into_iter()
|
||||||
.flat_map(|(group, items)| {
|
.flat_map(|(group, items)| {
|
||||||
let mut inner = items._into_table(head, index + 1);
|
let mut inner = items._into_table(head);
|
||||||
for row in &mut inner {
|
for row in &mut inner {
|
||||||
row.insert(grouper.clone(), group.clone().into_value(head));
|
row.push(group.clone().into_value(head));
|
||||||
}
|
}
|
||||||
inner
|
inner
|
||||||
})
|
})
|
||||||
|
|
Loading…
Reference in a new issue