X-Git-Url: http://git.scottworley.com/tablify/blobdiff_plain/1f6bd845277daaea2513cc3dc19a0907fe9f6d6c..58b5f36de045c760efa51b21a6d841f5b62558db:/src/lib.rs diff --git a/src/lib.rs b/src/lib.rs index 72a3add..fcf5dc8 100644 --- a/src/lib.rs +++ b/src/lib.rs @@ -1,4 +1,6 @@ #[cfg(test)] +use std::collections::{HashMap, HashSet}; +#[cfg(test)] use std::io::BufRead; #[cfg(test)] use std::iter::Iterator; @@ -10,13 +12,16 @@ struct RowInput { } struct Reader>> { - input: Input, + input: std::iter::Enumerate, row: Option, } impl>> Reader { #[cfg(test)] fn new(input: Input) -> Self { - Self { input, row: None } + Self { + input: input.enumerate(), + row: None, + } } } impl>> Iterator for Reader { @@ -26,19 +31,24 @@ impl>> Iterator for Reader match self .input .next() - .map(|r| r.map(|line| String::from(line.trim_end()))) + .map(|(n, r)| (n, r.map(|line| String::from(line.trim_end())))) { None => return Ok(std::mem::take(&mut self.row)).transpose(), - Some(Err(e)) => return Some(Err(e)), - Some(Ok(line)) if line.is_empty() && self.row.is_some() => { + Some((_, Err(e))) => return Some(Err(e)), + Some((_, Ok(line))) if line.is_empty() && self.row.is_some() => { return Ok(std::mem::take(&mut self.row)).transpose() } - Some(Ok(line)) if line.is_empty() => {} - Some(Ok(line)) if line.starts_with(' ') => match &mut self.row { - None => return Some(Err(std::io::Error::other("Entry with no header"))), + Some((_, Ok(line))) if line.is_empty() => {} + Some((n, Ok(line))) if line.starts_with(' ') => match &mut self.row { + None => { + return Some(Err(std::io::Error::other(format!( + "{}: Entry with no header", + n + 1 + )))) + } Some(ref mut row) => row.entries.push(String::from(line.trim())), }, - Some(Ok(line)) => { + Some((_, Ok(line))) => { let prev = std::mem::take(&mut self.row); self.row = Some(RowInput { label: line, @@ -58,6 +68,24 @@ fn read_rows(input: impl std::io::Read) -> impl Iterator Vec<(usize, String)> { + let mut counts: Vec<_> = rows + .iter() + .flat_map(|r| r.entries.iter().collect::>().into_iter()) + .fold(HashMap::new(), |mut cs, e| { + cs.entry(String::from(e)) + .and_modify(|n| *n += 1) + .or_insert(1); + cs + }) + .into_iter() + .map(|(col, n)| (n, col)) + .collect(); + counts.sort(); + counts +} + pub fn tablify(_input: &impl std::io::Read) -> String { String::from("Hello, world!") } @@ -153,10 +181,38 @@ mod tests { let bad = read_rows(&b" foo"[..]).next().unwrap(); assert!(bad.is_err()); - assert!(format!("{bad:?}").contains("Entry with no header")); + assert!(format!("{bad:?}").contains("1: Entry with no header")); let bad2 = read_rows(&b"foo\n\n bar"[..]).nth(1).unwrap(); assert!(bad2.is_err()); - assert!(format!("{bad2:?}").contains("Entry with no header")); + assert!(format!("{bad2:?}").contains("3: Entry with no header")); + } + + #[test] + fn test_column_counts() { + assert_eq!( + column_counts( + &read_rows(&b"foo\n bar\n baz\n"[..]) + .collect::, _>>() + .unwrap() + ), + vec![(1, String::from("bar")), (1, String::from("baz"))] + ); + assert_eq!( + column_counts( + &read_rows(&b"foo\n bar\n baz\nquux\n baz"[..]) + .collect::, _>>() + .unwrap() + ), + vec![(1, String::from("bar")), (2, String::from("baz"))] + ); + assert_eq!( + column_counts( + &read_rows(&b"foo\n bar\n bar\n baz\n bar\nquux\n baz"[..]) + .collect::, _>>() + .unwrap() + ), + vec![(1, String::from("bar")), (2, String::from("baz"))] + ); } }