2019-09-03 06:04:46 +00:00
|
|
|
use crate::commands::UnevaluatedCallInfo;
|
|
|
|
use crate::context::SpanSource;
|
2019-09-18 06:37:04 +00:00
|
|
|
use crate::data::meta::Span;
|
2019-09-05 16:23:42 +00:00
|
|
|
use crate::data::Value;
|
2019-09-03 06:04:46 +00:00
|
|
|
use crate::errors::ShellError;
|
2019-09-14 16:30:24 +00:00
|
|
|
use crate::parser::hir::SyntaxShape;
|
2019-09-03 06:04:46 +00:00
|
|
|
use crate::parser::registry::Signature;
|
|
|
|
use crate::prelude::*;
|
|
|
|
use mime::Mime;
|
|
|
|
use std::path::PathBuf;
|
|
|
|
use std::str::FromStr;
|
|
|
|
use surf::mime;
|
2019-09-18 06:37:04 +00:00
|
|
|
use uuid::Uuid;
|
2019-09-03 06:04:46 +00:00
|
|
|
/// The `fetch` command: loads the contents of a URL and, unless `--raw` is
/// given, tries to convert them into a table.
pub struct Fetch;
|
|
|
|
|
|
|
|
impl PerItemCommand for Fetch {
|
|
|
|
fn name(&self) -> &str {
|
|
|
|
"fetch"
|
|
|
|
}
|
|
|
|
|
|
|
|
fn signature(&self) -> Signature {
|
|
|
|
Signature::build(self.name())
|
2019-09-14 16:30:24 +00:00
|
|
|
.required("path", SyntaxShape::Path)
|
2019-09-03 06:04:46 +00:00
|
|
|
.switch("raw")
|
|
|
|
}
|
|
|
|
|
|
|
|
fn usage(&self) -> &str {
|
|
|
|
"Load from a URL into a cell, convert to table if possible (avoid by appending '--raw')"
|
|
|
|
}
|
|
|
|
|
|
|
|
fn run(
|
|
|
|
&self,
|
|
|
|
call_info: &CallInfo,
|
|
|
|
registry: &CommandRegistry,
|
|
|
|
raw_args: &RawCommandArgs,
|
|
|
|
_input: Tagged<Value>,
|
|
|
|
) -> Result<OutputStream, ShellError> {
|
|
|
|
run(call_info, registry, raw_args)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
fn run(
|
|
|
|
call_info: &CallInfo,
|
|
|
|
registry: &CommandRegistry,
|
|
|
|
raw_args: &RawCommandArgs,
|
|
|
|
) -> Result<OutputStream, ShellError> {
|
|
|
|
let path = match call_info
|
|
|
|
.args
|
|
|
|
.nth(0)
|
|
|
|
.ok_or_else(|| ShellError::string(&format!("No file or directory specified")))?
|
|
|
|
{
|
|
|
|
file => file,
|
|
|
|
};
|
|
|
|
let path_buf = path.as_path()?;
|
|
|
|
let path_str = path_buf.display().to_string();
|
2019-09-18 06:37:04 +00:00
|
|
|
let path_span = path.span();
|
2019-09-03 06:04:46 +00:00
|
|
|
let has_raw = call_info.args.has("raw");
|
|
|
|
let registry = registry.clone();
|
|
|
|
let raw_args = raw_args.clone();
|
|
|
|
|
2019-09-26 00:22:17 +00:00
|
|
|
let stream = async_stream! {
|
2019-09-03 06:04:46 +00:00
|
|
|
|
2019-09-18 06:37:04 +00:00
|
|
|
let result = fetch(&path_str, path_span).await;
|
2019-09-03 06:04:46 +00:00
|
|
|
|
|
|
|
if let Err(e) = result {
|
|
|
|
yield Err(e);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
let (file_extension, contents, contents_tag, span_source) = result.unwrap();
|
|
|
|
|
|
|
|
let file_extension = if has_raw {
|
|
|
|
None
|
|
|
|
} else {
|
|
|
|
// If the extension could not be determined via mimetype, try to use the path
|
|
|
|
// extension. Some file types do not declare their mimetypes (such as bson files).
|
|
|
|
file_extension.or(path_str.split('.').last().map(String::from))
|
|
|
|
};
|
|
|
|
|
2019-09-29 05:13:56 +00:00
|
|
|
if contents_tag.anchor != uuid::Uuid::nil() {
|
2019-09-03 06:04:46 +00:00
|
|
|
// If we have loaded something, track its source
|
|
|
|
yield ReturnSuccess::action(CommandAction::AddSpanSource(
|
2019-09-29 05:13:56 +00:00
|
|
|
contents_tag.anchor,
|
2019-09-03 06:04:46 +00:00
|
|
|
span_source,
|
|
|
|
));
|
|
|
|
}
|
|
|
|
|
|
|
|
let tagged_contents = contents.tagged(contents_tag);
|
|
|
|
|
|
|
|
if let Some(extension) = file_extension {
|
|
|
|
let command_name = format!("from-{}", extension);
|
|
|
|
if let Some(converter) = registry.get_command(&command_name) {
|
|
|
|
let new_args = RawCommandArgs {
|
|
|
|
host: raw_args.host,
|
|
|
|
shell_manager: raw_args.shell_manager,
|
|
|
|
call_info: UnevaluatedCallInfo {
|
|
|
|
args: crate::parser::hir::Call {
|
|
|
|
head: raw_args.call_info.args.head,
|
|
|
|
positional: None,
|
|
|
|
named: None
|
|
|
|
},
|
|
|
|
source: raw_args.call_info.source,
|
|
|
|
source_map: raw_args.call_info.source_map,
|
2019-09-14 16:30:24 +00:00
|
|
|
name_tag: raw_args.call_info.name_tag,
|
2019-09-03 06:04:46 +00:00
|
|
|
}
|
|
|
|
};
|
2019-09-17 02:09:15 +00:00
|
|
|
let mut result = converter.run(new_args.with_input(vec![tagged_contents]), ®istry, false);
|
2019-09-03 06:04:46 +00:00
|
|
|
let result_vec: Vec<Result<ReturnSuccess, ShellError>> = result.drain_vec().await;
|
|
|
|
for res in result_vec {
|
|
|
|
match res {
|
2019-09-05 16:23:42 +00:00
|
|
|
Ok(ReturnSuccess::Value(Tagged { item: Value::Table(list), ..})) => {
|
2019-09-03 06:04:46 +00:00
|
|
|
for l in list {
|
|
|
|
yield Ok(ReturnSuccess::Value(l));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
Ok(ReturnSuccess::Value(Tagged { item, .. })) => {
|
|
|
|
yield Ok(ReturnSuccess::Value(Tagged { item, tag: contents_tag }));
|
|
|
|
}
|
|
|
|
x => yield x,
|
|
|
|
}
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
yield ReturnSuccess::value(tagged_contents);
|
|
|
|
}
|
|
|
|
} else {
|
|
|
|
yield ReturnSuccess::value(tagged_contents);
|
|
|
|
}
|
|
|
|
};
|
|
|
|
|
|
|
|
Ok(stream.to_output_stream())
|
|
|
|
}
|
|
|
|
|
|
|
|
pub async fn fetch(
|
|
|
|
location: &str,
|
2019-09-18 06:37:04 +00:00
|
|
|
span: Span,
|
2019-09-03 06:04:46 +00:00
|
|
|
) -> Result<(Option<String>, Value, Tag, SpanSource), ShellError> {
|
|
|
|
if let Err(_) = url::Url::parse(location) {
|
|
|
|
return Err(ShellError::labeled_error(
|
|
|
|
"Incomplete or incorrect url",
|
|
|
|
"expected a full url",
|
2019-09-18 06:37:04 +00:00
|
|
|
span,
|
2019-09-03 06:04:46 +00:00
|
|
|
));
|
|
|
|
}
|
|
|
|
|
|
|
|
let response = surf::get(location).await;
|
|
|
|
match response {
|
|
|
|
Ok(mut r) => match r.headers().get("content-type") {
|
|
|
|
Some(content_type) => {
|
|
|
|
let content_type = Mime::from_str(content_type).unwrap();
|
|
|
|
match (content_type.type_(), content_type.subtype()) {
|
|
|
|
(mime::APPLICATION, mime::XML) => Ok((
|
|
|
|
Some("xml".to_string()),
|
|
|
|
Value::string(r.body_string().await.map_err(|_| {
|
|
|
|
ShellError::labeled_error(
|
|
|
|
"Could not load text from remote url",
|
|
|
|
"could not load",
|
2019-09-18 06:37:04 +00:00
|
|
|
span,
|
2019-09-03 06:04:46 +00:00
|
|
|
)
|
|
|
|
})?),
|
2019-09-18 06:37:04 +00:00
|
|
|
Tag {
|
|
|
|
span,
|
2019-09-29 05:13:56 +00:00
|
|
|
anchor: Uuid::new_v4(),
|
2019-09-18 06:37:04 +00:00
|
|
|
},
|
2019-09-03 06:04:46 +00:00
|
|
|
SpanSource::Url(location.to_string()),
|
|
|
|
)),
|
|
|
|
(mime::APPLICATION, mime::JSON) => Ok((
|
|
|
|
Some("json".to_string()),
|
|
|
|
Value::string(r.body_string().await.map_err(|_| {
|
|
|
|
ShellError::labeled_error(
|
|
|
|
"Could not load text from remote url",
|
|
|
|
"could not load",
|
2019-09-18 06:37:04 +00:00
|
|
|
span,
|
2019-09-03 06:04:46 +00:00
|
|
|
)
|
|
|
|
})?),
|
2019-09-18 06:37:04 +00:00
|
|
|
Tag {
|
|
|
|
span,
|
2019-09-29 05:13:56 +00:00
|
|
|
anchor: Uuid::new_v4(),
|
2019-09-18 06:37:04 +00:00
|
|
|
},
|
2019-09-03 06:04:46 +00:00
|
|
|
SpanSource::Url(location.to_string()),
|
|
|
|
)),
|
|
|
|
(mime::APPLICATION, mime::OCTET_STREAM) => {
|
|
|
|
let buf: Vec<u8> = r.body_bytes().await.map_err(|_| {
|
|
|
|
ShellError::labeled_error(
|
|
|
|
"Could not load binary file",
|
|
|
|
"could not load",
|
2019-09-18 06:37:04 +00:00
|
|
|
span,
|
2019-09-03 06:04:46 +00:00
|
|
|
)
|
|
|
|
})?;
|
|
|
|
Ok((
|
|
|
|
None,
|
2019-09-14 16:30:24 +00:00
|
|
|
Value::binary(buf),
|
2019-09-18 06:37:04 +00:00
|
|
|
Tag {
|
|
|
|
span,
|
2019-09-29 05:13:56 +00:00
|
|
|
anchor: Uuid::new_v4(),
|
2019-09-18 06:37:04 +00:00
|
|
|
},
|
2019-09-03 06:04:46 +00:00
|
|
|
SpanSource::Url(location.to_string()),
|
|
|
|
))
|
|
|
|
}
|
|
|
|
(mime::IMAGE, mime::SVG) => Ok((
|
|
|
|
Some("svg".to_string()),
|
|
|
|
Value::string(r.body_string().await.map_err(|_| {
|
|
|
|
ShellError::labeled_error(
|
|
|
|
"Could not load svg from remote url",
|
|
|
|
"could not load",
|
2019-09-18 06:37:04 +00:00
|
|
|
span,
|
2019-09-03 06:04:46 +00:00
|
|
|
)
|
|
|
|
})?),
|
2019-09-18 06:37:04 +00:00
|
|
|
Tag {
|
|
|
|
span,
|
2019-09-29 05:13:56 +00:00
|
|
|
anchor: Uuid::new_v4(),
|
2019-09-18 06:37:04 +00:00
|
|
|
},
|
2019-09-03 06:04:46 +00:00
|
|
|
SpanSource::Url(location.to_string()),
|
|
|
|
)),
|
|
|
|
(mime::IMAGE, image_ty) => {
|
|
|
|
let buf: Vec<u8> = r.body_bytes().await.map_err(|_| {
|
|
|
|
ShellError::labeled_error(
|
|
|
|
"Could not load image file",
|
|
|
|
"could not load",
|
2019-09-18 06:37:04 +00:00
|
|
|
span,
|
2019-09-03 06:04:46 +00:00
|
|
|
)
|
|
|
|
})?;
|
|
|
|
Ok((
|
|
|
|
Some(image_ty.to_string()),
|
2019-09-14 16:30:24 +00:00
|
|
|
Value::binary(buf),
|
2019-09-18 06:37:04 +00:00
|
|
|
Tag {
|
|
|
|
span,
|
2019-09-29 05:13:56 +00:00
|
|
|
anchor: Uuid::new_v4(),
|
2019-09-18 06:37:04 +00:00
|
|
|
},
|
2019-09-03 06:04:46 +00:00
|
|
|
SpanSource::Url(location.to_string()),
|
|
|
|
))
|
|
|
|
}
|
|
|
|
(mime::TEXT, mime::HTML) => Ok((
|
|
|
|
Some("html".to_string()),
|
|
|
|
Value::string(r.body_string().await.map_err(|_| {
|
|
|
|
ShellError::labeled_error(
|
|
|
|
"Could not load text from remote url",
|
|
|
|
"could not load",
|
2019-09-18 06:37:04 +00:00
|
|
|
span,
|
2019-09-03 06:04:46 +00:00
|
|
|
)
|
|
|
|
})?),
|
2019-09-18 06:37:04 +00:00
|
|
|
Tag {
|
|
|
|
span,
|
2019-09-29 05:13:56 +00:00
|
|
|
anchor: Uuid::new_v4(),
|
2019-09-18 06:37:04 +00:00
|
|
|
},
|
2019-09-03 06:04:46 +00:00
|
|
|
SpanSource::Url(location.to_string()),
|
|
|
|
)),
|
|
|
|
(mime::TEXT, mime::PLAIN) => {
|
|
|
|
let path_extension = url::Url::parse(location)
|
|
|
|
.unwrap()
|
|
|
|
.path_segments()
|
|
|
|
.and_then(|segments| segments.last())
|
|
|
|
.and_then(|name| if name.is_empty() { None } else { Some(name) })
|
|
|
|
.and_then(|name| {
|
|
|
|
PathBuf::from(name)
|
|
|
|
.extension()
|
|
|
|
.map(|name| name.to_string_lossy().to_string())
|
|
|
|
});
|
|
|
|
|
|
|
|
Ok((
|
|
|
|
path_extension,
|
|
|
|
Value::string(r.body_string().await.map_err(|_| {
|
|
|
|
ShellError::labeled_error(
|
|
|
|
"Could not load text from remote url",
|
|
|
|
"could not load",
|
2019-09-18 06:37:04 +00:00
|
|
|
span,
|
2019-09-03 06:04:46 +00:00
|
|
|
)
|
|
|
|
})?),
|
2019-09-18 06:37:04 +00:00
|
|
|
Tag {
|
|
|
|
span,
|
2019-09-29 05:13:56 +00:00
|
|
|
anchor: Uuid::new_v4(),
|
2019-09-18 06:37:04 +00:00
|
|
|
},
|
2019-09-03 06:04:46 +00:00
|
|
|
SpanSource::Url(location.to_string()),
|
|
|
|
))
|
|
|
|
}
|
|
|
|
(ty, sub_ty) => Ok((
|
|
|
|
None,
|
|
|
|
Value::string(format!("Not yet supported MIME type: {} {}", ty, sub_ty)),
|
2019-09-18 06:37:04 +00:00
|
|
|
Tag {
|
|
|
|
span,
|
2019-09-29 05:13:56 +00:00
|
|
|
anchor: Uuid::new_v4(),
|
2019-09-18 06:37:04 +00:00
|
|
|
},
|
2019-09-03 06:04:46 +00:00
|
|
|
SpanSource::Url(location.to_string()),
|
|
|
|
)),
|
|
|
|
}
|
|
|
|
}
|
|
|
|
None => Ok((
|
|
|
|
None,
|
|
|
|
Value::string(format!("No content type found")),
|
2019-09-18 06:37:04 +00:00
|
|
|
Tag {
|
|
|
|
span,
|
2019-09-29 05:13:56 +00:00
|
|
|
anchor: Uuid::new_v4(),
|
2019-09-18 06:37:04 +00:00
|
|
|
},
|
2019-09-03 06:04:46 +00:00
|
|
|
SpanSource::Url(location.to_string()),
|
|
|
|
)),
|
|
|
|
},
|
|
|
|
Err(_) => {
|
|
|
|
return Err(ShellError::labeled_error(
|
|
|
|
"URL could not be opened",
|
|
|
|
"url not found",
|
2019-09-18 06:37:04 +00:00
|
|
|
span,
|
2019-09-03 06:04:46 +00:00
|
|
|
));
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|