diff --git a/src/html/mod.rs b/src/html/mod.rs
index 83999b3..fa08ddc 100644
--- a/src/html/mod.rs
+++ b/src/html/mod.rs
@@ -30,39 +30,54 @@ pub fn escape_html>(s: &S) -> Cow<'_, str> {
encode_text_minimal(s)
}
-#[derive(Clone, Debug)]
+fn count_digits(n: u16) -> u8 {
+ f32::log10(n.into()).floor() as u8 + 1
+}
+
+#[derive(Clone, Debug, Default)]
+enum ListState {
+ #[default]
+ None,
+ Unordered,
+ Ordered {
+ counter: u16,
+ digits: u8,
+ },
+}
+
+#[derive(Clone, Debug, Default)]
struct FormatState {
style: Style,
padding: String,
+ list_state: ListState,
}
fn format_tree(
tree: Rc,
- state: FormatState,
+ state: &mut FormatState,
text: &mut Text<'static>,
mut previous_sibling_is_block: bool,
) -> bool {
use markup5ever_rcdom::NodeData::*;
- let state = match &tree.data {
- Document | Doctype { .. } | Comment { .. } | ProcessingInstruction { .. } => state,
+ let mut state = match &tree.data {
+ Document | Doctype { .. } | Comment { .. } | ProcessingInstruction { .. } => state.to_owned(),
Text { contents } => {
let s: String = contents.clone().into_inner().into();
let s = s.replace('\n', ""); // Lines are insignificant in HTML
if previous_sibling_is_block && !s.is_empty() {
text.lines.push(Line {
- spans: vec![Span {
- content: Cow::Owned(state.padding.to_owned()),
- style: state.style,
- }],
+ spans: vec![Span::styled(state.padding.to_owned(), state.style)],
alignment: None,
});
previous_sibling_is_block = false;
}
- text.lines.last_mut().unwrap().spans.push(Span {
- content: Cow::Owned(s.to_owned()),
- style: state.style,
- });
- state
+ text
+ .lines
+ .last_mut()
+ .unwrap()
+ .spans
+ .push(Span::styled(s, state.style));
+ state.to_owned()
},
Element {
name: QualName {
@@ -75,43 +90,116 @@ fn format_tree(
} => match name.as_ref() {
"br" => {
text.lines.push(Line::raw(state.padding.to_owned()));
- state
+ state.to_owned()
},
"p" => {
previous_sibling_is_block = true;
- state
+ state.to_owned()
},
"blockquote" => {
previous_sibling_is_block = true;
FormatState {
- padding: state.padding + "> ",
- ..state
+ padding: state.padding.to_owned() + "> ",
+ ..state.to_owned()
+ }
+ },
+ "ul" => {
+ previous_sibling_is_block = true;
+ FormatState {
+ list_state: ListState::Unordered,
+ ..state.to_owned()
+ }
+ },
+ "ol" => {
+ previous_sibling_is_block = true;
+ // FIXME: are not guaranteed to be direct children, are they?
+ let items_count: u16 = tree
+ .children
+ .borrow()
+ .iter()
+ .map(|child| match &child.data {
+ Element {
+ name:
+ QualName {
+ ns: ns!(html),
+ local,
+ ..
+ },
+ ..
+ } if local.as_ref() == "li" => 1,
+ _ => 0,
+ })
+ .sum();
+ FormatState {
+ list_state: ListState::Ordered {
+ counter: 0,
+ digits: count_digits(items_count),
+ },
+ ..state.to_owned()
+ }
+ },
+ "li" => {
+ previous_sibling_is_block = false;
+ match state.list_state {
+ ListState::None => state.to_owned(),
+ ListState::Unordered => {
+ let mut line = Line::default();
+ line
+ .spans
+ .push(Span::styled(state.padding.to_owned(), state.style));
+ line.spans.push(Span::styled("* ", state.style));
+ text.lines.push(line);
+ FormatState {
+ padding: state.padding.to_owned() + " ",
+ ..state.to_owned()
+ }
+ },
+ ListState::Ordered {
+ ref mut counter,
+ digits,
+ } => {
+ let mut line = Line::default();
+ line
+ .spans
+ .push(Span::styled(state.padding.to_owned(), state.style));
+ *counter += 1;
+ line
+ .spans
+ .push(Span::styled(format!("{}. ", counter), state.style));
+ if count_digits(*counter) != digits {
+ line.spans.push(Span::styled(
+ " ".repeat((digits - count_digits(*counter)).into()),
+ state.style,
+ ));
+ }
+ text.lines.push(line);
+ FormatState {
+ padding: state.padding.to_owned() + " " + &" ".repeat(digits.into()),
+ ..state.to_owned()
+ }
+ },
}
},
"em" | "i" => FormatState {
style: state.style.italic(),
- ..state
+ ..state.to_owned()
},
"strong" | "b" => FormatState {
style: state.style.bold(),
- ..state
+ ..state.to_owned()
},
"u" => FormatState {
style: state.style.underlined(),
- ..state
+ ..state.to_owned()
},
- _ => state,
+ _ => state.to_owned(),
},
- Element { .. } => state, // Element not in the HTML namespace
+ Element { .. } => state.to_owned(), // Element not in the HTML namespace
};
for subtree in tree.children.borrow().iter() {
- previous_sibling_is_block = format_tree(
- subtree.clone(),
- state.clone(),
- text,
- previous_sibling_is_block,
- );
+ previous_sibling_is_block =
+ format_tree(subtree.clone(), &mut state, text, previous_sibling_is_block);
}
match &tree.data {
@@ -146,11 +234,11 @@ pub fn format_html(s: &str) -> Text<'static> {
)
.one(s)
.document;
- let state = FormatState {
- style: Style::default(),
+ let mut state = FormatState {
padding: " ".to_owned(),
+ ..Default::default()
};
let mut text = Text::raw("");
- format_tree(tree, state, &mut text, false);
+ format_tree(tree, &mut state, &mut text, false);
text
}