coreutils/tests/test_split.rs

extern crate rand;
extern crate regex;

use self::rand::{thread_rng, Rng};
use self::regex::Regex;
use common::util::*;
use std::fs::{read_dir, File};
use std::io::Write;
use std::path::Path;

/// Returns a `String` of `n` items drawn from the `Alphanumeric`
/// distribution using the thread-local random number generator.
fn random_chars(n: usize) -> String {
    let alphabet = rand::distributions::Alphanumeric;
    // The return type drives `collect`, so no turbofish is needed.
    thread_rng().sample_iter(&alphabet).take(n).collect()
}

/// Selects the entries of a directory whose names match a regular expression.
struct Glob {
    /// Directory whose entries are listed when collecting matches.
    directory: AtPath,
    /// Pattern each entry name is tested against.
    regex: Regex,
}

impl Glob {
    /// Builds a `Glob` rooted at `directory`, resolved against `at` with
    /// `plus_as_string`, that selects names matching `regex`.
    ///
    /// # Panics
    ///
    /// Panics if `regex` cannot be compiled.
    fn new(at: &AtPath, directory: &str, regex: &str) -> Glob {
        let resolved = at.plus_as_string(directory);
        let directory = AtPath::new(Path::new(&resolved));
        let regex = Regex::new(regex).unwrap();
        Glob { directory, regex }
    }

    /// Returns how many directory entries currently match the pattern.
    fn count(&self) -> usize {
        let matching = self.collect();
        matching.len()
    }

    /// Lists the directory and returns the matching names, in the order the
    /// directory iterator yields them.
    ///
    /// Each entry path is first passed through `minus_as_string` on the glob's
    /// directory; a path that is not valid UTF-8 is treated as the empty
    /// string.
    ///
    /// # Panics
    ///
    /// Panics if the directory or one of its entries cannot be read.
    fn collect(&self) -> Vec<String> {
        let mut matching = Vec::new();
        for entry in read_dir(Path::new(&self.directory.subdir)).unwrap() {
            let path = entry.unwrap().path();
            let name = self.directory.minus_as_string(path.to_str().unwrap_or(""));
            if self.regex.is_match(&name) {
                matching.push(name);
            }
        }
        matching
    }

    /// Concatenates the contents of every matching file, visiting the files
    /// in sorted name order, and returns the resulting bytes.
    fn collate(&self) -> Vec<u8> {
        let mut names = self.collect();
        names.sort();
        names
            .iter()
            .flat_map(|name| self.directory.read(name).into_bytes())
            .collect()
    }
}

/// A file that can be filled with randomly generated content.
struct RandomFile {
    /// Handle of the underlying file that random data is written to.
    inner: File,
}

impl RandomFile {
    /// Creates the file `name`, with its path resolved through `at.plus`,
    /// and wraps the resulting handle.
    ///
    /// # Panics
    ///
    /// Panics if the file cannot be created.
    fn new(at: &AtPath, name: &str) -> RandomFile {
        RandomFile {
            inner: File::create(&at.plus(name)).expect("failed to create random fixture file"),
        }
    }

    /// Appends `bytes` random characters to the file, generating them in
    /// pieces of at most 1024 characters.
    ///
    /// # Panics
    ///
    /// Panics if a write fails. A silently truncated fixture would otherwise
    /// make the calling test exercise the wrong input.
    fn add_bytes(&mut self, bytes: usize) {
        const CHUNK_SIZE: usize = 1024;
        let mut remaining = bytes;
        while remaining > 0 {
            let len = remaining.min(CHUNK_SIZE);
            self.inner
                .write_all(random_chars(len).as_bytes())
                .expect("failed to write random bytes to fixture file");
            remaining -= len;
        }
    }

    /// Appends `lines` lines to the file, each made of 32 random characters
    /// followed by a newline.
    ///
    /// # Panics
    ///
    /// Panics if a write fails, for the same reason as `add_bytes`.
    fn add_lines(&mut self, lines: usize) {
        const LINE_SIZE: usize = 32;
        for _ in 0..lines {
            writeln!(self.inner, "{}", random_chars(LINE_SIZE))
                .expect("failed to write random line to fixture file");
        }
    }
}

/// Splitting a 2000-line file with no options must yield exactly two pieces
/// named `x` plus two letters, which together reproduce the input.
#[test]
fn test_split_default() {
    let (fixtures, mut cmd) = at_and_ucmd!();
    let input = "split_default";
    let pieces = Glob::new(&fixtures, ".", r"x[[:alpha:]][[:alpha:]]$");
    RandomFile::new(&fixtures, input).add_lines(2000);

    cmd.args(&[input]).succeeds();

    assert_eq!(pieces.count(), 2);
    // Reassembling the pieces in name order must give back the original bytes.
    let reassembled = pieces.collate();
    let original = fixtures.read(input).into_bytes();
    assert_eq!(reassembled, original);
}

/// `-d -b 1000` on a 10000-byte file with prefix `a` must yield ten pieces
/// named `a` plus two digits, which together reproduce the input.
#[test]
fn test_split_num_prefixed_chunks_by_bytes() {
    let (fixtures, mut cmd) = at_and_ucmd!();
    let input = "split_num_prefixed_chunks_by_bytes";
    let pieces = Glob::new(&fixtures, ".", r"a\d\d$");
    RandomFile::new(&fixtures, input).add_bytes(10000);

    cmd.args(&["-d", "-b", "1000", input, "a"]).succeeds();

    assert_eq!(pieces.count(), 10);
    // Reassembling the pieces in name order must give back the original bytes.
    let reassembled = pieces.collate();
    let original = fixtures.read(input).into_bytes();
    assert_eq!(reassembled, original);
}

/// `-b 1000` on a 10000-byte file with prefix `b` must yield ten pieces
/// named `b` plus two letters, which together reproduce the input.
#[test]
fn test_split_str_prefixed_chunks_by_bytes() {
    let (fixtures, mut cmd) = at_and_ucmd!();
    let input = "split_str_prefixed_chunks_by_bytes";
    let pieces = Glob::new(&fixtures, ".", r"b[[:alpha:]][[:alpha:]]$");
    RandomFile::new(&fixtures, input).add_bytes(10000);

    cmd.args(&["-b", "1000", input, "b"]).succeeds();

    assert_eq!(pieces.count(), 10);
    // Reassembling the pieces in name order must give back the original bytes.
    let reassembled = pieces.collate();
    let original = fixtures.read(input).into_bytes();
    assert_eq!(reassembled, original);
}

/// `-d -l 1000` on a 10000-line file with prefix `c` must yield ten pieces
/// named `c` plus two digits, which together reproduce the input.
#[test]
fn test_split_num_prefixed_chunks_by_lines() {
    let (fixtures, mut cmd) = at_and_ucmd!();
    let input = "split_num_prefixed_chunks_by_lines";
    let pieces = Glob::new(&fixtures, ".", r"c\d\d$");
    RandomFile::new(&fixtures, input).add_lines(10000);

    cmd.args(&["-d", "-l", "1000", input, "c"]).succeeds();

    assert_eq!(pieces.count(), 10);
    // Reassembling the pieces in name order must give back the original bytes.
    let reassembled = pieces.collate();
    let original = fixtures.read(input).into_bytes();
    assert_eq!(reassembled, original);
}

/// `-l 1000` on a 10000-line file with prefix `d` must yield ten pieces
/// named `d` plus two letters, which together reproduce the input.
#[test]
fn test_split_str_prefixed_chunks_by_lines() {
    let (fixtures, mut cmd) = at_and_ucmd!();
    let input = "split_str_prefixed_chunks_by_lines";
    let pieces = Glob::new(&fixtures, ".", r"d[[:alpha:]][[:alpha:]]$");
    RandomFile::new(&fixtures, input).add_lines(10000);

    cmd.args(&["-l", "1000", input, "d"]).succeeds();

    assert_eq!(pieces.count(), 10);
    // Reassembling the pieces in name order must give back the original bytes.
    let reassembled = pieces.collate();
    let original = fixtures.read(input).into_bytes();
    assert_eq!(reassembled, original);
}
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`extern crate rand;`
			`extern crate regex;`

rustfmt the tests 2020-04-13 18:36:03 +00:00			`use self::rand::{thread_rng, Rng};`
tests: extern crates in separated test modules 2016-08-06 03:18:34 +00:00			`use self::regex::Regex;`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`use common::util::*;`
rustfmt the tests 2020-04-13 18:36:03 +00:00			`use std::fs::{read_dir, File};`
			`use std::io::Write;`
			`use std::path::Path;`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00
			`fn random_chars(n: usize) -> String {`
rustfmt the tests 2020-04-13 18:36:03 +00:00			`thread_rng()`
			`.sample_iter(&rand::distributions::Alphanumeric)`
			`.take(n)`
			`.collect::<String>()`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`}`

			`struct Glob {`
			`directory: AtPath,`
			`regex: Regex,`
			`}`

			`impl Glob {`
			`fn new(at: &AtPath, directory: &str, regex: &str) -> Glob {`
			`Glob {`
			`directory: AtPath::new(Path::new(&at.plus_as_string(directory))),`
			`regex: Regex::new(regex).unwrap(),`
			`}`
			`}`

			`fn count(&self) -> usize {`
			`self.collect().len()`
			`}`

			`fn collect(&self) -> Vec<String> {`
			`read_dir(Path::new(&self.directory.subdir))`
			`.unwrap()`
			`.filter_map(\|entry\| {`
			`let path = entry.unwrap().path();`
rustfmt the tests 2020-04-13 18:36:03 +00:00			`let name = self`
			`.directory`
			`.minus_as_string(path.as_path().to_str().unwrap_or(""));`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`if self.regex.is_match(&name) {`
			`Some(name)`
			`} else {`
			`None`
			`}`
			`})`
			`.collect()`
			`}`

			`fn collate(&self) -> Vec<u8> {`
			`let mut files = self.collect();`
			`files.sort();`
			`let mut data: Vec<u8> = vec![];`
Fix clippy warnings 2016-11-25 19:14:46 +00:00			`for name in &files {`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`data.extend(self.directory.read(name).into_bytes());`
			`}`
			`data`
			`}`
			`}`

			`struct RandomFile {`
			`inner: File,`
			`}`

			`impl RandomFile {`
			`fn new(at: &AtPath, name: &str) -> RandomFile {`
rustfmt the tests 2020-04-13 18:36:03 +00:00			`RandomFile {`
			`inner: File::create(&at.plus(name)).unwrap(),`
			`}`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`}`

			`fn add_bytes(&mut self, bytes: usize) {`
rustfmt the tests 2020-04-13 18:36:03 +00:00			`let chunk_size: usize = if bytes >= 1024 { 1024 } else { bytes };`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`let mut n = bytes;`
			`while n > chunk_size {`
			`let _ = write!(self.inner, "{}", random_chars(chunk_size));`
			`n -= chunk_size;`
			`}`
			`let _ = write!(self.inner, "{}", random_chars(n));`
			`}`

			`fn add_lines(&mut self, lines: usize) {`
			`let line_size: usize = 32;`
			`let mut n = lines;`
			`while n > 0 {`
			`let _ = writeln!(self.inner, "{}", random_chars(line_size));`
			`n -= 1;`
			`}`
			`}`
			`}`

			`#[test]`
			`fn test_split_default() {`
tests: remove helper function boilerplate via macros 2016-08-23 11:52:43 +00:00			`let (at, mut ucmd) = at_and_ucmd!();`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`let name = "split_default";`
Update for changes in regex 2017-01-11 23:45:21 +00:00			`let glob = Glob::new(&at, ".", r"x[[:alpha:]][[:alpha:]]$");`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`RandomFile::new(&at, name).add_lines(2000);`
tests: normalize around chaining asserts Although for some tests this adds characters we still use them there because the brevity cost is now worth the benefit in terms of instant, natural-language readability and recognizability for people not familiar with this tests of this module or even the project 2016-08-13 21:59:21 +00:00			`ucmd.args(&[name]).succeeds();`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`assert_eq!(glob.count(), 2);`
			`assert_eq!(glob.collate(), at.read(name).into_bytes());`
			`}`

			`#[test]`
			`fn test_split_num_prefixed_chunks_by_bytes() {`
tests: remove helper function boilerplate via macros 2016-08-23 11:52:43 +00:00			`let (at, mut ucmd) = at_and_ucmd!();`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`let name = "split_num_prefixed_chunks_by_bytes";`
			`let glob = Glob::new(&at, ".", r"a\d\d$");`
			`RandomFile::new(&at, name).add_bytes(10000);`
tests: normalize around chaining asserts Although for some tests this adds characters we still use them there because the brevity cost is now worth the benefit in terms of instant, natural-language readability and recognizability for people not familiar with this tests of this module or even the project 2016-08-13 21:59:21 +00:00			`ucmd.args(&["-d", "-b", "1000", name, "a"]).succeeds();`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`assert_eq!(glob.count(), 10);`
			`assert_eq!(glob.collate(), at.read(name).into_bytes());`
			`}`

			`#[test]`
			`fn test_split_str_prefixed_chunks_by_bytes() {`
tests: remove helper function boilerplate via macros 2016-08-23 11:52:43 +00:00			`let (at, mut ucmd) = at_and_ucmd!();`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`let name = "split_str_prefixed_chunks_by_bytes";`
Update for changes in regex 2017-01-11 23:45:21 +00:00			`let glob = Glob::new(&at, ".", r"b[[:alpha:]][[:alpha:]]$");`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`RandomFile::new(&at, name).add_bytes(10000);`
tests: normalize around chaining asserts Although for some tests this adds characters we still use them there because the brevity cost is now worth the benefit in terms of instant, natural-language readability and recognizability for people not familiar with this tests of this module or even the project 2016-08-13 21:59:21 +00:00			`ucmd.args(&["-b", "1000", name, "b"]).succeeds();`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`assert_eq!(glob.count(), 10);`
			`assert_eq!(glob.collate(), at.read(name).into_bytes());`
			`}`

			`#[test]`
			`fn test_split_num_prefixed_chunks_by_lines() {`
tests: remove helper function boilerplate via macros 2016-08-23 11:52:43 +00:00			`let (at, mut ucmd) = at_and_ucmd!();`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`let name = "split_num_prefixed_chunks_by_lines";`
			`let glob = Glob::new(&at, ".", r"c\d\d$");`
			`RandomFile::new(&at, name).add_lines(10000);`
tests: normalize around chaining asserts Although for some tests this adds characters we still use them there because the brevity cost is now worth the benefit in terms of instant, natural-language readability and recognizability for people not familiar with this tests of this module or even the project 2016-08-13 21:59:21 +00:00			`ucmd.args(&["-d", "-l", "1000", name, "c"]).succeeds();`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`assert_eq!(glob.count(), 10);`
			`assert_eq!(glob.collate(), at.read(name).into_bytes());`
			`}`

			`#[test]`
			`fn test_split_str_prefixed_chunks_by_lines() {`
tests: remove helper function boilerplate via macros 2016-08-23 11:52:43 +00:00			`let (at, mut ucmd) = at_and_ucmd!();`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`let name = "split_str_prefixed_chunks_by_lines";`
Update for changes in regex 2017-01-11 23:45:21 +00:00			`let glob = Glob::new(&at, ".", r"d[[:alpha:]][[:alpha:]]$");`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`RandomFile::new(&at, name).add_lines(10000);`
tests: normalize around chaining asserts Although for some tests this adds characters we still use them there because the brevity cost is now worth the benefit in terms of instant, natural-language readability and recognizability for people not familiar with this tests of this module or even the project 2016-08-13 21:59:21 +00:00			`ucmd.args(&["-l", "1000", name, "d"]).succeeds();`
rewrite tests for cargo compat, decoupled directory, output handling 2015-11-16 05:25:01 +00:00			`assert_eq!(glob.count(), 10);`
			`assert_eq!(glob.collate(), at.read(name).into_bytes());`
			`}`