X-Git-Url: http://git.scottworley.com/tablify/blobdiff_plain/f272e502c4d1e2e33ab1e9fe460df69ff8f8ccd2..12e913005080a9f60750d807c220a58704429361:/src/lib.rs
diff --git a/src/lib.rs b/src/lib.rs
index e90f66b..dbcfc7b 100644
--- a/src/lib.rs
+++ b/src/lib.rs
@@ -1,22 +1,126 @@
-#[cfg(test)]
+use std::borrow::ToOwned;
use std::collections::HashMap;
-#[cfg(test)]
+use std::fmt::Write;
use std::io::BufRead;
-#[cfg(test)]
use std::iter::Iterator;
+pub struct Config {
+ pub column_threshold: usize,
+}
+
+const HEADER: &str = r#"
+
+
+
+
+
+
+
+
+
+
+"#;
+const FOOTER: &str = "
+
+
+";
+
+#[derive(PartialEq, Eq, Debug)]
+pub struct HTML(String);
+impl HTML {
+ fn escape(value: &str) -> HTML {
+ let mut escaped: String = String::new();
+ for c in value.chars() {
+ match c {
+ '>' => escaped.push_str("&gt;"),
+ '<' => escaped.push_str("&lt;"),
+ '\'' => escaped.push_str("&#39;"),
+ '"' => escaped.push_str("&quot;"),
+ '&' => escaped.push_str("&amp;"),
+ ok_c => escaped.push(ok_c),
+ }
+ }
+ HTML(escaped)
+ }
+}
+impl From<&str> for HTML {
+ fn from(value: &str) -> HTML {
+ HTML(String::from(value))
+ }
+}
+impl FromIterator<HTML> for HTML {
+ fn from_iter<T>(iter: T) -> HTML
+ where
+ T: IntoIterator<Item = HTML>,
+ {
+ HTML(iter.into_iter().map(|html| html.0).collect::<String>())
+ }
+}
+impl std::fmt::Display for HTML {
+ fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
+ write!(f, "{}", self.0)
+ }
+}
+
#[derive(Debug, PartialEq, Eq)]
-struct RowInput {
+enum InputLine<'a> {
+ Blank,
+ RowHeader(&'a str),
+ Entry(&'a str, Option<&'a str>),
+}
+impl<'a> From<&'a str> for InputLine<'a> {
+ fn from(value: &'a str) -> InputLine<'a> {
+ let trimmed = value.trim_end();
+ if trimmed.is_empty() {
+ InputLine::Blank
+ } else if !trimmed.starts_with(' ') {
+ InputLine::RowHeader(value.trim())
+ } else {
+ match value.split_once(':') {
+ None => InputLine::Entry(value.trim(), None),
+ Some((col, instance)) => InputLine::Entry(col.trim(), Some(instance.trim())),
+ }
+ }
+ }
+}
+
+#[derive(Debug, PartialEq, Eq)]
+struct Row {
label: String,
- entries: Vec<String>,
+ entries: HashMap<String, Vec<Option<String>>>,
+}
+
+#[derive(Debug, PartialEq, Eq)]
+enum Rowlike {
+ Row(Row),
+ Spacer,
}
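struct Reader<Input: Iterator<Item = Result<String, std::io::Error>>> {
input: std::iter::Enumerate<Input>,
- row: Option<RowInput>,
+ row: Option<Row>,
}
impl<Input: Iterator<Item = Result<String, std::io::Error>>> Reader<Input> {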
- #[cfg(test)]
fn new(input: Input) -> Self {
Self {
input: input.enumerate(),
@@ -25,181 +129,512 @@ impl<Input: Iterator<Item = Result<String, std::io::Error>>> Reader<Input> {
}
}
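impl<Input: Iterator<Item = Result<String, std::io::Error>>> Iterator for Reader<Input> {
- type Item = Result<RowInput, std::io::Error>;
+ type Item = Result<Rowlike, std::io::Error>;
fn next(&mut self) -> Option<Self::Item> {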
loop {
- match self
- .input
- .next()
- .map(|(n, r)| (n, r.map(|line| String::from(line.trim_end()))))
- {
- None => return Ok(std::mem::take(&mut self.row)).transpose(),
+ match self.input.next() {
+ None => return Ok(std::mem::take(&mut self.row).map(Rowlike::Row)).transpose(),
Some((_, Err(e))) => return Some(Err(e)),
- Some((_, Ok(line))) if line.is_empty() && self.row.is_some() => {
- return Ok(std::mem::take(&mut self.row)).transpose()
- }
- Some((_, Ok(line))) if line.is_empty() => {}
- Some((n, Ok(line))) if line.starts_with(' ') => match &mut self.row {
- None => {
- return Some(Err(std::io::Error::other(format!(
- "{}: Entry with no header",
- n + 1
- ))))
+ Some((n, Ok(line))) => match InputLine::from(line.as_ref()) {
+ InputLine::Blank if self.row.is_some() => {
+ return Ok(std::mem::take(&mut self.row).map(Rowlike::Row)).transpose()
}
- Some(ref mut row) => row.entries.push(String::from(line.trim())),
- },
- Some((_, Ok(line))) => {
- let prev = std::mem::take(&mut self.row);
- self.row = Some(RowInput {
- label: line,
- entries: vec![],
- });
- if prev.is_some() {
- return Ok(prev).transpose();
+ InputLine::Blank => return Some(Ok(Rowlike::Spacer)),
+ InputLine::Entry(col, instance) => match &mut self.row {
+ None => {
+ return Some(Err(std::io::Error::other(format!(
+ "{}: Entry with no header",
+ n + 1
+ ))))
+ }
+ Some(ref mut row) => {
+ row.entries
+ .entry(col.to_owned())
+ .and_modify(|is| is.push(instance.map(ToOwned::to_owned)))
+ .or_insert_with(|| vec![instance.map(ToOwned::to_owned)]);
+ }
+ },
+ InputLine::RowHeader(row) => {
+ let prev = std::mem::take(&mut self.row);
+ self.row = Some(Row {
+ label: row.to_owned(),
+ entries: HashMap::new(),
+ });
+ if prev.is_some() {
+ return Ok(prev.map(Rowlike::Row)).transpose();
+ }
}
- }
+ },
}
}
}
}
-#[cfg(test)]
-fn read_rows(input: impl std::io::Read) -> impl Iterator<Item = Result<RowInput, std::io::Error>> {
- Reader::new(std::io::BufReader::new(input).lines())
+fn read_rows(input: impl std::io::Read) -> Result<Vec<Rowlike>, std::io::Error> {
+ Reader::new(std::io::BufReader::new(input).lines()).collect::<Result<Vec<_>, _>>()
}
-#[cfg(test)]
-fn column_counts(rows: &[RowInput]) -> HashMap<String, usize> {
- rows.iter()
- .flat_map(|r| r.entries.iter())
- .fold(HashMap::new(), |mut counts, e| {
- counts
- .entry(String::from(e))
- .and_modify(|c| *c += 1)
+fn column_counts(rows: &[Rowlike]) -> Vec<(usize, String)> {
+ let empty = HashMap::new();
+ let mut counts: Vec<_> = rows
+ .iter()
+ .flat_map(|rl| match rl {
+ Rowlike::Row(r) => r.entries.keys(),
+ Rowlike::Spacer => empty.keys(),
+ })
+ .fold(HashMap::new(), |mut cs, col| {
+ cs.entry(col.to_owned())
+ .and_modify(|n| *n += 1)
.or_insert(1);
- counts
+ cs
})
+ .into_iter()
+ .map(|(col, n)| (n, col))
+ .collect();
+ counts.sort_unstable_by(|(an, acol), (bn, bcol)| bn.cmp(an).then(acol.cmp(bcol)));
+ counts
+}
+fn column_order(config: &Config, rows: &[Rowlike]) -> Vec<String> {
+ column_counts(rows)
+ .into_iter()
+ .filter_map(|(n, col)| (n >= config.column_threshold).then_some(col))
+ .collect()
+}
+
+fn render_one_instance(instance: &Option<String>) -> HTML {
+ match instance {
+ None => HTML::from("â"),
+ Some(instance) => HTML::escape(instance.as_ref()),
+ }
}
-pub fn tablify(_input: &impl std::io::Read) -> String {
- String::from("Hello, world!")
+fn render_instances(instances: &[Option<String>]) -> HTML {
+ let all_empty = instances.iter().all(Option::is_none);
+ if all_empty && instances.len() == 1 {
+ HTML::from("")
+ } else if all_empty {
+ HTML(format!("{}", instances.len()))
+ } else {
+ HTML(
+ instances
+ .iter()
+ .map(render_one_instance)
+ .map(|html| html.0) // Waiting for slice_concat_trait to stabilize
+ .collect::<Vec<_>>()
+ .join(" "),
+ )
+ }
+}
+
+fn render_cell(col: &str, row: &mut Row) -> HTML {
+ let row_label = HTML::escape(row.label.as_ref());
+ let col_label = HTML::escape(col);
+ let instances: Option<&Vec