// Post-patch contents of src/lib.rs, reconstructed from the blobdiff at
// http://git.scottworley.com/tablify/blobdiff_plain/ece97615567c7bc537f960d1784d652b11c0e66c..397ef957e293901c2945f815e585474608fe2c9d:/src/lib.rs
// (index 820f43e..c7271f3).

#[cfg(test)]
use std::collections::{HashMap, HashSet};
#[cfg(test)]
use std::io::BufRead;
#[cfg(test)]
use std::iter::Iterator;

/// One parsed row: a label line followed by zero or more indented entry lines.
#[derive(Debug, PartialEq, Eq)]
struct RowInput {
    /// The unindented header line, with trailing whitespace removed.
    label: String,
    /// The indented lines that followed the label, trimmed on both sides,
    /// in input order (duplicates are kept).
    entries: Vec<String>,
}

/// Groups a stream of text lines into [`RowInput`]s.
///
/// `row` holds the row currently being accumulated; it is yielded when the
/// next label line, a blank line, or the end of input is reached.
struct Reader<Input: Iterator<Item = Result<String, std::io::Error>>> {
    /// Source lines paired with their zero-based index (used for error messages).
    input: std::iter::Enumerate<Input>,
    /// The row under construction, if a label has been seen and not yet yielded.
    row: Option<RowInput>,
}

impl<Input: Iterator<Item = Result<String, std::io::Error>>> Reader<Input> {
    /// Wraps `input` in a reader with no row in progress.
    #[cfg(test)]
    fn new(input: Input) -> Self {
        Self {
            input: input.enumerate(),
            row: None,
        }
    }
}

impl<Input: Iterator<Item = Result<String, std::io::Error>>> Iterator for Reader<Input> {
    type Item = Result<RowInput, std::io::Error>;

    /// Returns the next completed row, an error, or `None` at end of input.
    ///
    /// Line classification (after stripping trailing whitespace):
    /// * empty line: ends the row in progress, if any; otherwise ignored;
    /// * line starting with a space: an entry for the row in progress, or an
    ///   "Entry with no header" error (with a one-based line number) when
    ///   there is no row in progress;
    /// * anything else: a label that starts a new row and ends the previous one.
    ///
    /// I/O errors from the underlying iterator are passed through unchanged.
    fn next(&mut self) -> Option<Self::Item> {
        loop {
            let (n, line) = match self.input.next() {
                // End of input: flush whatever row is still pending.
                None => return self.row.take().map(Ok),
                Some((_, Err(e))) => return Some(Err(e)),
                Some((n, Ok(raw))) => (n, String::from(raw.trim_end())),
            };

            if line.is_empty() {
                // A blank line terminates the current row; with no row in
                // progress it is simply skipped.
                if let Some(done) = self.row.take() {
                    return Some(Ok(done));
                }
            } else if line.starts_with(' ') {
                match &mut self.row {
                    None => {
                        return Some(Err(std::io::Error::other(format!(
                            "{}: Entry with no header",
                            n + 1
                        ))))
                    }
                    Some(row) => row.entries.push(String::from(line.trim())),
                }
            } else {
                // A new label: start its row and hand back the previous one.
                let fresh = RowInput {
                    label: line,
                    entries: vec![],
                };
                if let Some(prev) = self.row.replace(fresh) {
                    return Some(Ok(prev));
                }
            }
        }
    }
}

/// Parses `input` line by line into an iterator of rows.
#[cfg(test)]
fn read_rows(input: impl std::io::Read) -> impl Iterator<Item = Result<RowInput, std::io::Error>> {
    Reader::new(std::io::BufReader::new(input).lines())
}

/// Counts, for every distinct entry, the number of rows that contain it.
///
/// Entries are de-duplicated within each row first, so an entry repeated
/// inside one row contributes 1 to its count.
#[cfg(test)]
fn column_counts(rows: &[RowInput]) -> HashMap<String, usize> {
    rows.iter()
        .flat_map(|r| r.entries.iter().collect::<HashSet<_>>().into_iter())
        .fold(HashMap::new(), |mut counts, e| {
            counts
                .entry(String::from(e))
                .and_modify(|c| *c += 1)
                .or_insert(1);
            counts
        })
}

/// Placeholder entry point: ignores `_input` and returns a fixed greeting.
pub fn tablify(_input: &impl std::io::Read) -> String {
    String::from("Hello, world!")
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_read_rows() {
        assert_eq!(
            read_rows(&b"foo"[..]).flatten().collect::<Vec<_>>(),
            vec![RowInput {
                label: String::from("foo"),
                entries: vec![]
            }]
        );
        assert_eq!(
            read_rows(&b"bar"[..]).flatten().collect::<Vec<_>>(),
            vec![RowInput {
                label: String::from("bar"),
                entries: vec![]
            }]
        );
        assert_eq!(
            read_rows(&b"foo\nbar\n"[..]).flatten().collect::<Vec<_>>(),
            vec![
                RowInput {
                    label: String::from("foo"),
                    entries: vec![]
                },
                RowInput {
                    label: String::from("bar"),
                    entries: vec![]
                }
            ]
        );
        assert_eq!(
            read_rows(&b"foo\n bar\n"[..]).flatten().collect::<Vec<_>>(),
            vec![RowInput {
                label: String::from("foo"),
                entries: vec![String::from("bar")]
            }]
        );
        assert_eq!(
            read_rows(&b"foo\n bar\n baz\n"[..])
                .flatten()
                .collect::<Vec<_>>(),
            vec![RowInput {
                label: String::from("foo"),
                entries: vec![String::from("bar"), String::from("baz")]
            }]
        );
        assert_eq!(
            read_rows(&b"foo\n\nbar\n"[..])
                .flatten()
                .collect::<Vec<_>>(),
            vec![
                RowInput {
                    label: String::from("foo"),
                    entries: vec![]
                },
                RowInput {
                    label: String::from("bar"),
                    entries: vec![]
                }
            ]
        );
        assert_eq!(
            read_rows(&b"foo\n \nbar\n"[..])
                .flatten()
                .collect::<Vec<_>>(),
            vec![
                RowInput {
                    label: String::from("foo"),
                    entries: vec![]
                },
                RowInput {
                    label: String::from("bar"),
                    entries: vec![]
                }
            ]
        );
        assert_eq!(
            read_rows(&b"foo \n bar \n"[..])
                .flatten()
                .collect::<Vec<_>>(),
            vec![RowInput {
                label: String::from("foo"),
                entries: vec![String::from("bar")]
            }]
        );

        let bad = read_rows(&b" foo"[..]).next().unwrap();
        assert!(bad.is_err());
        assert!(format!("{bad:?}").contains("1: Entry with no header"));

        let bad2 = read_rows(&b"foo\n\n bar"[..]).nth(1).unwrap();
        assert!(bad2.is_err());
        assert!(format!("{bad2:?}").contains("3: Entry with no header"));
    }

    #[test]
    fn test_column_counts() {
        assert_eq!(
            column_counts(
                &read_rows(&b"foo\n bar\n baz\n"[..])
                    .collect::<Result<Vec<_>, _>>()
                    .unwrap()
            ),
            HashMap::from([(String::from("bar"), 1), (String::from("baz"), 1)])
        );
        assert_eq!(
            column_counts(
                &read_rows(&b"foo\n bar\n baz\nquux\n baz"[..])
                    .collect::<Result<Vec<_>, _>>()
                    .unwrap()
            ),
            HashMap::from([(String::from("bar"), 1), (String::from("baz"), 2)])
        );
        assert_eq!(
            column_counts(
                &read_rows(&b"foo\n bar\n bar\n baz\n bar\nquux\n baz"[..])
                    .collect::<Result<Vec<_>, _>>()
                    .unwrap()
            ),
            HashMap::from([(String::from("bar"), 1), (String::from("baz"), 2)])
        );
    }
}