coreutils/src/cat/cat.rs

348 lines
12 KiB
Rust
Raw Normal View History

2014-07-06 08:13:36 +00:00
#![crate_name = "cat"]
2013-08-04 23:54:10 +00:00
/*
* This file is part of the uutils coreutils package.
*
* (c) Jordi Boggiano <j.boggiano@seld.be>
*
* For the full copyright and license information, please view the LICENSE
* file that was distributed with this source code.
*/
/* last synced with: cat (GNU coreutils) 8.13 */
extern crate getopts;
extern crate libc;
2013-08-04 23:54:10 +00:00
use getopts::Options;
use std::fs::File;
use std::intrinsics::{copy_nonoverlapping};
use std::io::{stdout, stdin, stderr, Write, Read, Result};
use libc::consts::os::posix88::STDIN_FILENO;
use libc::funcs::posix88::unistd::isatty;
use libc::types::os::arch::c95::c_int;
2013-08-04 23:54:10 +00:00
2015-05-29 17:51:11 +00:00
#[path = "../common/util.rs"]
#[macro_use]
mod util;
static NAME: &'static str = "cat";
static VERSION: &'static str = "1.0.0";
pub fn uumain(args: Vec<String>) -> i32 {
let mut opts = Options::new();
opts.optflag("A", "show-all", "equivalent to -vET");
opts.optflag("b", "number-nonblank",
"number nonempty output lines, overrides -n");
opts.optflag("e", "", "equivalent to -vE");
opts.optflag("E", "show-ends", "display $ at end of each line");
opts.optflag("n", "number", "number all output lines");
opts.optflag("s", "squeeze-blank", "suppress repeated empty output lines");
opts.optflag("t", "", "equivalent to -vT");
opts.optflag("T", "show-tabs", "display TAB characters as ^I");
opts.optflag("v", "show-nonprinting",
"use ^ and M- notation, except for LF (\\n) and TAB (\\t)");
opts.optflag("h", "help", "display this help and exit");
opts.optflag("V", "version", "output version information and exit");
let matches = match opts.parse(&args[1..]) {
2013-08-04 23:54:10 +00:00
Ok(m) => m,
2014-10-30 09:06:47 +00:00
Err(f) => panic!("Invalid options\n{}", f)
2013-08-04 23:54:10 +00:00
};
2013-10-22 12:22:10 +00:00
if matches.opt_present("help") {
let msg = format!("{} {}\n\n\
Usage:\n {0} [OPTION]... [FILE]...\n\n\
Concatenate FILE(s), or standard input, to standard output.\n\n\
With no FILE, or when FILE is -, read standard input.", NAME, VERSION);
print!("{}", opts.usage(&msg));
return 0;
2013-08-04 23:54:10 +00:00
}
2013-10-22 12:22:10 +00:00
if matches.opt_present("version") {
println!("{} {}", NAME, VERSION);
return 0;
2013-08-04 23:54:10 +00:00
}
2015-05-22 16:51:03 +00:00
let number_mode = if matches.opt_present("b") {
NumberingMode::NumberNonEmpty
} else if matches.opt_present("n") {
NumberingMode::NumberAll
} else {
NumberingMode::NumberNone
};
2014-11-19 20:55:25 +00:00
let show_nonprint = matches.opts_present(&["A".to_string(), "e".to_string(),
2014-05-27 21:48:37 +00:00
"t".to_string(), "v".to_string()]);
2014-11-19 20:55:25 +00:00
let show_ends = matches.opts_present(&["E".to_string(), "A".to_string(),
2014-05-27 21:48:37 +00:00
"e".to_string()]);
2014-11-19 20:55:25 +00:00
let show_tabs = matches.opts_present(&["A".to_string(), "T".to_string(),
2014-05-27 21:48:37 +00:00
"t".to_string()]);
let squeeze_blank = matches.opt_present("s");
2013-08-04 23:54:10 +00:00
let mut files = matches.free;
if files.is_empty() {
2014-05-27 21:48:37 +00:00
files.push("-".to_string());
2013-08-04 23:54:10 +00:00
}
exec(files, number_mode, show_nonprint, show_ends, show_tabs, squeeze_blank);
0
2013-08-04 23:54:10 +00:00
}
2015-01-08 12:56:41 +00:00
#[derive(Eq, PartialEq)]
2014-05-27 21:48:37 +00:00
enum NumberingMode {
2013-08-04 23:54:10 +00:00
NumberNone,
NumberNonEmpty,
NumberAll,
}
2014-05-27 21:48:37 +00:00
fn write_lines(files: Vec<String>, number: NumberingMode, squeeze_blank: bool,
show_ends: bool) {
2013-08-04 23:54:10 +00:00
2015-01-10 18:07:08 +00:00
let mut line_counter: usize = 1;
2013-08-04 23:54:10 +00:00
2015-02-22 11:55:30 +00:00
for (mut reader, interactive) in files.iter().filter_map(|p| open(&p[..])) {
2014-05-27 21:48:37 +00:00
2015-01-08 12:58:23 +00:00
let mut in_buf = [0; 1024 * 31];
let mut out_buf = [0; 1024 * 64];
let mut writer = UnsafeWriter::new(&mut out_buf[..], stdout());
2014-05-27 21:48:37 +00:00
let mut at_line_start = true;
while let Ok(n) = reader.read(&mut in_buf) {
if n == 0 { break }
let in_buf = &in_buf[..n];
let mut buf_pos = 0..n;
2014-05-27 21:48:37 +00:00
loop {
writer.possibly_flush();
let pos = match buf_pos.next() {
Some(p) => p,
None => break,
};
if in_buf[pos] == '\n' as u8 {
if !at_line_start || !squeeze_blank {
2014-11-19 20:50:37 +00:00
if at_line_start && number == NumberingMode::NumberAll {
2014-11-21 09:09:43 +00:00
(write!(&mut writer, "{0:6}\t", line_counter)).unwrap();
2014-05-27 21:48:37 +00:00
line_counter += 1;
}
if show_ends {
writer.write_all(&['$' as u8]).unwrap();
2014-05-27 21:48:37 +00:00
}
writer.write_all(&['\n' as u8]).unwrap();
2014-05-27 21:48:37 +00:00
if interactive {
writer.flush().unwrap();
}
}
at_line_start = true;
continue;
}
2014-11-19 20:50:37 +00:00
if at_line_start && number != NumberingMode::NumberNone {
2014-11-21 09:09:43 +00:00
(write!(&mut writer, "{0:6}\t", line_counter)).unwrap();
2014-05-27 21:48:37 +00:00
line_counter += 1;
}
match in_buf[pos..].iter().position(|c| *c == '\n' as u8) {
2014-05-27 21:48:37 +00:00
Some(p) => {
2015-01-29 07:45:08 +00:00
writer.write_all(&in_buf[pos..pos + p]).unwrap();
2014-05-27 21:48:37 +00:00
if show_ends {
writer.write_all(&['$' as u8]).unwrap();
2014-05-27 21:48:37 +00:00
}
writer.write_all(&['\n' as u8]).unwrap();
2014-05-27 21:48:37 +00:00
if interactive {
writer.flush().unwrap();
}
buf_pos = pos + p + 1..n;
2014-05-27 21:48:37 +00:00
at_line_start = true;
},
None => {
2015-01-29 07:45:08 +00:00
writer.write_all(&in_buf[pos..]).unwrap();
2014-05-27 21:48:37 +00:00
at_line_start = false;
break;
}
};
}
}
}
2013-08-04 23:54:10 +00:00
}
2014-05-27 21:48:37 +00:00
fn write_bytes(files: Vec<String>, number: NumberingMode, squeeze_blank: bool,
show_ends: bool, show_nonprint: bool, show_tabs: bool) {
2013-08-04 23:54:10 +00:00
2015-01-10 18:07:08 +00:00
let mut line_counter: usize = 1;
2015-02-22 11:55:30 +00:00
for (mut reader, interactive) in files.iter().filter_map(|p| open(&p[..])) {
2013-08-04 23:54:10 +00:00
2014-05-27 21:48:37 +00:00
// Flush all 1024 iterations.
let mut flush_counter = 0usize..1024;
2014-05-27 21:48:37 +00:00
2015-01-08 12:58:23 +00:00
let mut in_buf = [0; 1024 * 32];
let mut out_buf = [0; 1024 * 64];
let mut writer = UnsafeWriter::new(&mut out_buf[..], stdout());
2014-05-27 21:48:37 +00:00
let mut at_line_start = true;
while let Ok(n) = reader.read(&mut in_buf) {
if n == 0 { break }
for &byte in in_buf[..n].iter() {
2014-05-27 21:48:37 +00:00
if flush_counter.next().is_none() {
writer.possibly_flush();
flush_counter = 0usize..1024;
2014-05-27 21:48:37 +00:00
}
if byte == '\n' as u8 {
if !at_line_start || !squeeze_blank {
2014-11-19 20:50:37 +00:00
if at_line_start && number == NumberingMode::NumberAll {
2014-11-21 09:09:43 +00:00
(write!(&mut writer, "{0:6}\t", line_counter)).unwrap();
2014-05-27 21:48:37 +00:00
line_counter += 1;
2013-08-04 23:54:10 +00:00
}
2014-05-27 21:48:37 +00:00
if show_ends {
writer.write_all(&['$' as u8]).unwrap();
2014-05-27 21:48:37 +00:00
}
writer.write_all(&['\n' as u8]).unwrap();
2014-05-27 21:48:37 +00:00
if interactive {
writer.flush().unwrap();
}
}
at_line_start = true;
continue;
}
2014-11-19 20:50:37 +00:00
if at_line_start && number != NumberingMode::NumberNone {
2014-11-21 09:09:43 +00:00
(write!(&mut writer, "{0:6}\t", line_counter)).unwrap();
2014-05-27 21:48:37 +00:00
line_counter += 1;
at_line_start = false;
2013-08-04 23:54:10 +00:00
}
2014-05-27 21:48:37 +00:00
// This code is slow because of the many branches. cat in glibc avoids
// this by having the whole loop inside show_nonprint.
if byte == '\t' as u8 {
if show_tabs {
writer.write_all("^I".as_bytes())
2014-05-27 21:48:37 +00:00
} else {
writer.write_all(&[byte])
2014-05-27 21:48:37 +00:00
}
} else if show_nonprint {
let byte = match byte {
128 ... 255 => {
writer.write_all("M-".as_bytes()).unwrap();
2014-05-27 21:48:37 +00:00
byte - 128
},
_ => byte,
};
match byte {
2015-01-29 07:45:08 +00:00
0 ... 31 => writer.write_all(&['^' as u8, byte + 64]),
127 => writer.write_all(&['^' as u8, byte - 64]),
_ => writer.write_all(&[byte]),
2014-05-27 21:48:37 +00:00
}
} else {
writer.write_all(&[byte])
2014-05-27 21:48:37 +00:00
}.unwrap();
2013-08-04 23:54:10 +00:00
}
}
}
2014-05-27 21:48:37 +00:00
}
2013-08-04 23:54:10 +00:00
2014-05-27 21:48:37 +00:00
fn write_fast(files: Vec<String>) {
let mut writer = stdout();
2015-01-08 12:58:23 +00:00
let mut in_buf = [0; 1024 * 64];
2014-05-27 21:48:37 +00:00
2015-02-22 11:55:30 +00:00
for (mut reader, _) in files.iter().filter_map(|p| open(&p[..])) {
while let Ok(n) = reader.read(&mut in_buf) {
if n == 0 { break }
// This interface is completely broken.
2015-01-29 07:45:08 +00:00
writer.write_all(&in_buf[..n]).unwrap();
2013-08-04 23:54:10 +00:00
}
}
}
2014-05-27 21:48:37 +00:00
fn exec(files: Vec<String>, number: NumberingMode, show_nonprint: bool,
show_ends: bool, show_tabs: bool, squeeze_blank: bool) {
if show_nonprint || show_tabs {
write_bytes(files, number, squeeze_blank, show_ends, show_nonprint, show_tabs);
2014-11-19 20:50:37 +00:00
} else if number != NumberingMode::NumberNone || squeeze_blank || show_ends {
2014-05-27 21:48:37 +00:00
write_lines(files, number, squeeze_blank, show_ends);
} else {
write_fast(files);
2013-08-04 23:54:10 +00:00
}
2015-05-29 17:51:11 +00:00
pipe_flush!();
2014-05-27 21:48:37 +00:00
}
2013-08-04 23:54:10 +00:00
fn open(path: &str) -> Option<(Box<Read>, bool)> {
2014-05-27 21:48:37 +00:00
if path == "-" {
let stdin = stdin();
let interactive = unsafe { isatty(STDIN_FILENO) } != 0 as c_int;
return Some((Box::new(stdin) as Box<Read>, interactive));
2013-08-04 23:54:10 +00:00
}
2014-05-27 21:48:37 +00:00
match File::open(path) {
Ok(f) => Some((Box::new(f) as Box<Read>, false)),
2014-05-27 21:48:37 +00:00
Err(e) => {
2014-11-22 06:27:54 +00:00
(writeln!(&mut stderr(), "cat: {0}: {1}", path, e.to_string())).unwrap();
None
2014-05-27 21:48:37 +00:00
},
}
2013-08-04 23:54:10 +00:00
}
2014-05-27 21:48:37 +00:00
struct UnsafeWriter<'a, W: Write> {
2014-05-27 21:48:37 +00:00
inner: W,
buf: &'a mut [u8],
2015-01-10 18:07:08 +00:00
pos: usize,
threshold: usize,
2014-05-27 21:48:37 +00:00
}
impl<'a, W: Write> UnsafeWriter<'a, W> {
2014-05-27 21:48:37 +00:00
fn new(buf: &'a mut [u8], inner: W) -> UnsafeWriter<'a, W> {
let threshold = buf.len()/2;
UnsafeWriter {
inner: inner,
buf: buf,
pos: 0,
threshold: threshold,
}
}
fn flush_buf(&mut self) -> Result<()> {
2014-05-27 21:48:37 +00:00
if self.pos != 0 {
let ret = self.inner.write(&self.buf[..self.pos]);
2014-05-27 21:48:37 +00:00
self.pos = 0;
match ret {
Ok(_) => Ok(()),
Err(e) => Err(e),
}
2014-05-27 21:48:37 +00:00
} else {
Ok(())
}
}
fn possibly_flush(&mut self) {
if self.pos > self.threshold {
2015-01-29 07:45:08 +00:00
self.inner.write_all(&self.buf[..self.pos]).unwrap();
2014-05-27 21:48:37 +00:00
self.pos = 0;
}
}
}
#[inline(never)]
fn fail() -> ! {
2014-10-30 09:06:47 +00:00
panic!("assertion failed");
2014-05-27 21:48:37 +00:00
}
impl<'a, W: Write> Write for UnsafeWriter<'a, W> {
fn write(&mut self, buf: &[u8]) -> Result<usize> {
let dst = &mut self.buf[self.pos..];
let len = buf.len();
if len > dst.len() {
2014-05-27 21:48:37 +00:00
fail();
}
unsafe {
copy_nonoverlapping(buf.as_ptr(), dst.as_mut_ptr(), len)
2014-05-27 21:48:37 +00:00
}
self.pos += len;
Ok(len)
2014-05-27 21:48:37 +00:00
}
fn flush(&mut self) -> Result<()> {
2014-05-27 21:48:37 +00:00
self.flush_buf().and_then(|()| self.inner.flush())
}
}
impl<'a, W: Write> Drop for UnsafeWriter<'a, W> {
2014-05-27 21:48:37 +00:00
fn drop(&mut self) {
let _ = self.flush_buf();
}
}
/* vim: set ai ts=4 sw=4 sts=4 et : */