2019-11-17 03:18:41 +00:00
|
|
|
use crate::commands::WholeStreamCommand;
|
|
|
|
use crate::data::{Primitive, Value};
|
|
|
|
use crate::prelude::*;
|
|
|
|
use crate::{TaggedDictBuilder, TaggedListBuilder};
|
|
|
|
use calamine::*;
|
|
|
|
use std::io::Cursor;
|
|
|
|
|
|
|
|
/// Marker type for the `from-xlsx` command; the behaviour lives in its
/// `WholeStreamCommand` implementation.
pub struct FromXLSX;
|
|
|
|
|
|
|
|
#[derive(Deserialize)]
|
|
|
|
pub struct FromXLSXArgs {
|
|
|
|
headerless: bool,
|
|
|
|
}
|
|
|
|
|
|
|
|
impl WholeStreamCommand for FromXLSX {
|
|
|
|
fn name(&self) -> &str {
|
|
|
|
"from-xlsx"
|
|
|
|
}
|
|
|
|
|
|
|
|
fn signature(&self) -> Signature {
|
|
|
|
Signature::build("from-xlsx")
|
|
|
|
.switch("headerless", "don't treat the first row as column names")
|
|
|
|
}
|
|
|
|
|
|
|
|
fn usage(&self) -> &str {
|
|
|
|
"Parse binary Excel(.xlsx) data and create table."
|
|
|
|
}
|
|
|
|
|
|
|
|
fn run(
|
|
|
|
&self,
|
|
|
|
args: CommandArgs,
|
|
|
|
registry: &CommandRegistry,
|
|
|
|
) -> Result<OutputStream, ShellError> {
|
|
|
|
args.process(registry, from_xlsx)?.run()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn from_xlsx(
|
|
|
|
FromXLSXArgs {
|
|
|
|
headerless: _headerless,
|
|
|
|
}: FromXLSXArgs,
|
|
|
|
runnable_context: RunnableContext,
|
|
|
|
) -> Result<OutputStream, ShellError> {
|
|
|
|
let input = runnable_context.input;
|
|
|
|
let tag = runnable_context.name;
|
|
|
|
|
|
|
|
let stream = async_stream! {
|
2019-11-21 14:33:14 +00:00
|
|
|
let values: Vec<Value> = input.values.collect().await;
|
2019-11-17 03:18:41 +00:00
|
|
|
|
|
|
|
for value in values {
|
2019-11-21 14:33:14 +00:00
|
|
|
let value_span = value.tag.span;
|
|
|
|
let value_tag = value.tag.clone();
|
|
|
|
|
|
|
|
match value.value {
|
|
|
|
UntaggedValue::Primitive(Primitive::Binary(vb)) => {
|
2019-11-17 03:18:41 +00:00
|
|
|
let mut buf: Cursor<Vec<u8>> = Cursor::new(vb);
|
|
|
|
let mut xls = Xlsx::<_>::new(buf).unwrap();
|
|
|
|
|
|
|
|
let mut dict = TaggedDictBuilder::new(&tag);
|
|
|
|
|
|
|
|
let sheet_names = xls.sheet_names().to_owned();
|
|
|
|
|
|
|
|
for sheet_name in &sheet_names {
|
|
|
|
let mut sheet_output = TaggedListBuilder::new(&tag);
|
|
|
|
|
|
|
|
let current_sheet = xls.worksheet_range(sheet_name).unwrap().unwrap();
|
|
|
|
|
|
|
|
for row in current_sheet.rows() {
|
|
|
|
let mut row_output = TaggedDictBuilder::new(&tag);
|
|
|
|
for (i, cell) in row.iter().enumerate() {
|
|
|
|
let value = match cell {
|
2019-11-21 14:33:14 +00:00
|
|
|
DataType::Empty => UntaggedValue::nothing(),
|
|
|
|
DataType::String(s) => UntaggedValue::string(s),
|
|
|
|
DataType::Float(f) => UntaggedValue::decimal(*f),
|
|
|
|
DataType::Int(i) => UntaggedValue::int(*i),
|
|
|
|
DataType::Bool(b) => UntaggedValue::boolean(*b),
|
|
|
|
_ => UntaggedValue::nothing(),
|
2019-11-17 03:18:41 +00:00
|
|
|
};
|
|
|
|
|
2019-11-21 14:33:14 +00:00
|
|
|
row_output.insert_untagged(&format!("Column{}", i), value);
|
2019-11-17 03:18:41 +00:00
|
|
|
}
|
|
|
|
|
2019-11-21 14:33:14 +00:00
|
|
|
sheet_output.push_untagged(row_output.into_untagged_value());
|
2019-11-17 03:18:41 +00:00
|
|
|
}
|
|
|
|
|
2019-11-21 14:33:14 +00:00
|
|
|
dict.insert_untagged(sheet_name, sheet_output.into_untagged_value());
|
2019-11-17 03:18:41 +00:00
|
|
|
}
|
|
|
|
|
2019-11-21 14:33:14 +00:00
|
|
|
yield ReturnSuccess::value(dict.into_value());
|
2019-11-17 03:18:41 +00:00
|
|
|
}
|
|
|
|
_ => yield Err(ShellError::labeled_error_with_secondary(
|
|
|
|
"Expected binary data from pipeline",
|
|
|
|
"requires binary data input",
|
|
|
|
&tag,
|
|
|
|
"value originates from here",
|
|
|
|
value_tag,
|
|
|
|
)),
|
|
|
|
|
|
|
|
}
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
Ok(stream.to_output_stream())
|
|
|
|
}
|