bat/src/input.rs

288 lines
7.9 KiB
Rust
Raw Normal View History

use std::ffi::{OsStr, OsString};
2018-10-07 09:54:01 +00:00
use std::fs::File;
2020-04-21 19:14:44 +00:00
use std::io::{self, BufRead, BufReader, Read};
2018-10-07 09:54:01 +00:00
2018-10-07 14:44:59 +00:00
use content_inspector::{self, ContentType};
2020-04-22 19:45:47 +00:00
use crate::error::*;
2018-10-07 09:54:01 +00:00
2020-05-15 23:18:10 +00:00
/// A description of an Input source.
/// This tells bat how to refer to the input.
#[derive(Clone)]
pub struct InputDescription {
    /// Where the input came from (e.g. a file name).
    name: String,
    /// Optional label for the type of input (e.g. "File").
    kind: Option<String>,
    /// Optional explicit summary; when absent, one is derived from `kind` and `name`.
    summary: Option<String>,
}

impl InputDescription {
    /// Creates a description for an input.
    ///
    /// The name should describe where the input came from (e.g. "README.md").
    /// The kind and summary start out unset.
    pub fn new(name: impl Into<String>) -> Self {
        InputDescription {
            name: name.into(),
            kind: None,
            summary: None,
        }
    }

    /// A description for the type of input (e.g. "File").
    ///
    /// Passing `None` clears any previously set kind.
    pub fn with_kind(mut self, kind: Option<impl Into<String>>) -> Self {
        self.kind = kind.map(Into::into);
        self
    }

    /// A summary description of the input.
    ///
    /// Passing `None` clears any explicit summary, in which case `summary()`
    /// falls back to "{lowercased kind} '{name}'", or to just the name when
    /// no kind is set.
    pub fn with_summary(mut self, summary: Option<impl Into<String>>) -> Self {
        self.summary = summary.map(Into::into);
        self
    }

    /// Returns the name given to `new`.
    pub fn name(&self) -> &String {
        &self.name
    }

    /// Returns the kind of input, if one was set with `with_kind`.
    pub fn kind(&self) -> Option<&String> {
        self.kind.as_ref()
    }

    /// Returns the summary of this input.
    ///
    /// An explicit summary wins; otherwise the result is the lowercased kind
    /// followed by the quoted name, or the bare name when there is no kind.
    pub fn summary(&self) -> String {
        match (&self.summary, &self.kind) {
            (Some(summary), _) => summary.clone(),
            (None, Some(kind)) => format!("{} '{}'", kind.to_lowercase(), self.name),
            (None, None) => self.name.clone(),
        }
    }
}
2020-04-22 16:30:06 +00:00
/// The source an `Input` reads from before it has been opened.
pub(crate) enum InputKind<'a> {
    /// A file on disk, identified by its path.
    OrdinaryFile(OsString),
    /// The standard input stream.
    StdIn,
    /// A caller-supplied reader.
    CustomReader(Box<dyn Read + 'a>),
}
2020-05-15 23:18:10 +00:00
impl<'a> InputKind<'a> {
    /// Builds the default description for this kind of input.
    ///
    /// Files are named after their (lossily converted) path and given the
    /// kind "File"; standard input and custom readers get the fixed names
    /// "STDIN" and "READER" with no kind.
    pub fn description(&self) -> InputDescription {
        match self {
            InputKind::StdIn => InputDescription::new("STDIN"),
            InputKind::CustomReader(_) => InputDescription::new("READER"),
            InputKind::OrdinaryFile(path) => {
                let file_name = path.to_string_lossy();
                InputDescription::new(file_name).with_kind(Some("File"))
            }
        }
    }
}
2020-04-22 14:27:34 +00:00
/// Extra information attached to an input, independent of where it is read from.
#[derive(Clone, Default)]
pub(crate) struct InputMetadata {
    /// A name supplied by the user for this input, if any.
    pub(crate) user_provided_name: Option<OsString>,
}
pub struct Input<'a> {
2020-04-22 16:30:06 +00:00
pub(crate) kind: InputKind<'a>,
pub(crate) metadata: InputMetadata,
2020-05-15 23:18:10 +00:00
pub(crate) description: Option<InputDescription>,
2020-04-22 14:27:34 +00:00
}
2020-04-22 16:30:06 +00:00
/// The source of an input after it has been opened.
///
/// Unlike `InputKind`, the custom-reader variant carries no payload.
pub(crate) enum OpenedInputKind {
    /// A file on disk, identified by its path.
    OrdinaryFile(OsString),
    /// The standard input stream.
    StdIn,
    /// A caller-supplied reader.
    CustomReader,
}
2020-04-22 16:30:06 +00:00
pub(crate) struct OpenedInput<'a> {
pub(crate) kind: OpenedInputKind,
pub(crate) metadata: InputMetadata,
pub(crate) reader: InputReader<'a>,
2020-05-15 23:18:10 +00:00
pub(crate) description: InputDescription,
2018-10-07 09:21:41 +00:00
}
2018-10-07 09:54:01 +00:00
impl<'a> Input<'a> {
2020-04-22 14:27:34 +00:00
pub fn ordinary_file(path: &OsStr) -> Self {
Input {
kind: InputKind::OrdinaryFile(path.to_os_string()),
metadata: InputMetadata::default(),
2020-05-15 23:18:10 +00:00
description: None,
2018-10-07 09:54:01 +00:00
}
}
2020-04-21 20:24:47 +00:00
2020-04-22 14:27:34 +00:00
pub fn stdin() -> Self {
Input {
kind: InputKind::StdIn,
metadata: InputMetadata::default(),
2020-05-15 23:18:10 +00:00
description: None,
2020-04-22 14:27:34 +00:00
}
}
pub fn from_reader(reader: Box<dyn Read + 'a>) -> Self {
Input {
kind: InputKind::CustomReader(reader),
metadata: InputMetadata::default(),
2020-05-15 23:18:10 +00:00
description: None,
}
}
2020-04-22 14:27:34 +00:00
pub fn is_stdin(&self) -> bool {
if let InputKind::StdIn = self.kind {
true
} else {
false
}
}
2020-04-22 20:41:25 +00:00
pub fn with_name(mut self, provided_name: Option<&OsStr>) -> Self {
2020-04-22 14:27:34 +00:00
self.metadata.user_provided_name = provided_name.map(|n| n.to_owned());
2020-04-22 20:41:25 +00:00
self
2020-04-22 14:27:34 +00:00
}
2020-05-15 23:18:10 +00:00
pub fn with_description(mut self, description: Option<InputDescription>) -> Self {
self.description = description;
self
}
pub fn description(&self) -> InputDescription {
if let Some(ref description) = self.description {
description.clone()
} else if let Some(ref name) = self.metadata.user_provided_name {
InputDescription::new(name.to_string_lossy()).with_kind(Some("File"))
} else {
self.kind.description()
}
}
2020-04-22 16:30:06 +00:00
pub(crate) fn open<R: BufRead + 'a>(self, stdin: R) -> Result<OpenedInput<'a>> {
2020-05-15 23:18:10 +00:00
let description = self.description().clone();
2020-04-22 14:27:34 +00:00
match self.kind {
InputKind::StdIn => Ok(OpenedInput {
kind: OpenedInputKind::StdIn,
2020-05-15 23:18:10 +00:00
description,
2020-04-22 14:27:34 +00:00
metadata: self.metadata,
reader: InputReader::new(stdin),
}),
InputKind::OrdinaryFile(path) => Ok(OpenedInput {
kind: OpenedInputKind::OrdinaryFile(path.clone()),
2020-05-15 23:18:10 +00:00
description,
2020-04-22 14:27:34 +00:00
metadata: self.metadata,
reader: {
let file = File::open(&path)
.map_err(|e| format!("'{}': {}", path.to_string_lossy(), e))?;
if file.metadata()?.is_dir() {
return Err(format!("'{}' is a directory.", path.to_string_lossy()).into());
}
InputReader::new(BufReader::new(file))
},
}),
InputKind::CustomReader(reader) => Ok(OpenedInput {
2020-05-15 23:18:10 +00:00
description,
2020-04-22 14:27:34 +00:00
kind: OpenedInputKind::CustomReader,
metadata: self.metadata,
reader: InputReader::new(BufReader::new(reader)),
}),
}
}
}
2020-04-22 16:30:06 +00:00
pub(crate) struct InputReader<'a> {
2020-04-21 20:24:47 +00:00
inner: Box<dyn BufRead + 'a>,
pub(crate) first_line: Vec<u8>,
pub(crate) content_type: Option<ContentType>,
}
impl<'a> InputReader<'a> {
    /// Wraps `reader`, eagerly reading its first line so that the content
    /// type can be detected from it.
    ///
    /// Errors while reading the first line are deliberately ignored; whatever
    /// bytes were read before the error are kept as the first line.
    fn new<R: BufRead + 'a>(mut reader: R) -> InputReader<'a> {
        let mut first_line = vec![];
        reader.read_until(b'\n', &mut first_line).ok();

        let content_type = if first_line.is_empty() {
            None
        } else {
            Some(content_inspector::inspect(&first_line[..]))
        };

        if content_type == Some(ContentType::UTF_16LE) {
            // A UTF-16LE newline is the byte pair 0x0A 0x00, so also consume
            // up to the next 0x00 to finish the line terminator.
            reader.read_until(0x00, &mut first_line).ok();
        }

        InputReader {
            inner: Box::new(reader),
            first_line,
            content_type,
        }
    }

    /// Appends the next line (including its terminator) to `buf`.
    ///
    /// Returns `Ok(true)` if a line was produced and `Ok(false)` once the
    /// input is exhausted. The first call hands out the line that was read
    /// eagerly by `new`.
    pub(crate) fn read_line(&mut self, buf: &mut Vec<u8>) -> io::Result<bool> {
        if !self.first_line.is_empty() {
            // `append` drains `first_line`, so later calls read from `inner`.
            buf.append(&mut self.first_line);
            return Ok(true);
        }

        let got_data = self.inner.read_until(b'\n', buf).map(|size| size > 0)?;

        if self.content_type == Some(ContentType::UTF_16LE) {
            // Best-effort read of the remainder of the UTF-16LE line
            // terminator; a failure here is intentionally not reported.
            self.inner.read_until(0x00, buf).ok();
        }

        Ok(got_data)
    }
}
2018-10-07 10:29:38 +00:00
// Reads a two-line ASCII input line by line and checks that the first line is
// available up front, that both lines come back verbatim, and that the reader
// then reports end of input.
#[test]
fn basic() {
    let content = b"#!/bin/bash\necho hello";
    let mut reader = InputReader::new(&content[..]);

    assert_eq!(b"#!/bin/bash\n", &reader.first_line[..]);

    let mut buffer = vec![];

    let res = reader.read_line(&mut buffer);
    assert!(res.is_ok());
    assert!(res.unwrap());
    assert_eq!(b"#!/bin/bash\n", &buffer[..]);

    buffer.clear();

    let res = reader.read_line(&mut buffer);
    assert!(res.is_ok());
    assert!(res.unwrap());
    assert_eq!(b"echo hello", &buffer[..]);

    buffer.clear();

    let res = reader.read_line(&mut buffer);
    assert!(res.is_ok());
    assert!(!res.unwrap());
    assert!(buffer.is_empty());
}
2018-10-07 14:44:59 +00:00
// Reads a UTF-16LE input (BOM, "s", newline, "d") and checks that each line
// includes the full two-byte newline (0x0A 0x00) rather than stopping after
// the 0x0A byte.
#[test]
fn utf16le() {
    let content = b"\xFF\xFE\x73\x00\x0A\x00\x64\x00";
    let mut reader = InputReader::new(&content[..]);

    assert_eq!(b"\xFF\xFE\x73\x00\x0A\x00", &reader.first_line[..]);

    let mut buffer = vec![];

    let res = reader.read_line(&mut buffer);
    assert!(res.is_ok());
    assert!(res.unwrap());
    assert_eq!(b"\xFF\xFE\x73\x00\x0A\x00", &buffer[..]);

    buffer.clear();

    let res = reader.read_line(&mut buffer);
    assert!(res.is_ok());
    assert!(res.unwrap());
    assert_eq!(b"\x64\x00", &buffer[..]);

    buffer.clear();

    let res = reader.read_line(&mut buffer);
    assert!(res.is_ok());
    assert!(!res.unwrap());
    assert!(buffer.is_empty());
}