use core::fmt;
pub use tag::{Tag, TagIterator, TagIteratorMut};
//mod query;
mod tag;
pub struct Html {
pub nodes: Vec,
}
impl Html {
pub fn parse>(raw: S) -> Self {
let mut raw = raw.as_ref();
let mut nodes = vec![];
loop {
let Consumed { node, remaining } = Self::parse_node(raw);
nodes.push(node);
match remaining {
None => break Self { nodes },
Some(rem) => raw = rem,
}
}
}
pub fn child_tags(&self) -> TagIterator {
TagIterator {
inner: self.nodes.iter(),
}
}
pub fn child_tags_mut(&mut self) -> TagIteratorMut {
TagIteratorMut {
inner: self.nodes.iter_mut(),
}
}
pub fn get_by_tag_name_mut(&mut self, looking: &str) -> Option<&mut Tag> {
// depth first
fn find_node<'a>(tag: &'a mut Tag, looking: &str) -> Option<&'a mut Tag> {
if tag.name.as_str() == looking {
return Some(tag);
}
for child in tag.child_tags_mut() {
if let Some(tag) = find_node(child, looking) {
return Some(tag);
}
}
None
}
for child in self.child_tags_mut() {
if let Some(tag) = find_node(child, looking) {
return Some(tag);
}
}
None
}
pub fn get_parent_that_contains_tag_name_mut(&mut self, looking: &str) -> Option<&mut Tag> {
// depth first
fn find_node<'a>(tag: &'a mut Tag, looking: &str) -> Option<&'a mut Tag> {
if tag.has_tag(looking) {
return Some(tag);
}
for child_tag in tag.child_tags_mut() {
if let Some(tag) = find_node(child_tag, looking) {
return Some(tag);
}
}
None
}
for child_tag in self.child_tags_mut() {
if let Some(tag) = find_node(child_tag, looking) {
return Some(tag);
}
}
None
}
pub fn get_by_id(&self, id: &str) -> Option<&Tag> {
// depth first
fn find_node<'a>(tag: &'a Tag, id: &str) -> Option<&'a Tag> {
if tag.id().unwrap_or_default() == id {
return Some(tag);
}
for child in tag.child_tags() {
if let Some(tag) = find_node(child, id) {
return Some(tag);
}
}
None
}
for child in self.child_tags() {
if let Some(tag) = find_node(child, id) {
return Some(tag);
}
}
None
}
fn parse_node(raw: &str) -> Consumed {
match Self::is_tag(raw) {
Some(_) => {
if let Some(cmt) = Self::parse_comment(raw) {
cmt
} else {
Self::parse_tag(raw)
}
}
None => {
let cons = Self::parse_text(raw);
cons
}
}
}
fn parse_tag(raw: &str) -> Consumed {
let (root_tag, mut rest) = Self::is_tag(raw).unwrap();
let mut tag = if root_tag.body.is_empty() {
Tag {
name: root_tag.name.to_owned(),
body: None,
self_closing: root_tag.self_closing,
children: vec![],
}
} else {
Tag {
name: root_tag.name.into(),
body: Some(root_tag.body.to_owned()),
self_closing: root_tag.self_closing,
children: vec![],
}
};
if root_tag.closing {
panic!(
"found closing tag when not expected! {:?}\n{raw}",
root_tag.name
)
} else if root_tag.self_closing {
return Consumed {
node: Node::Tag(tag),
remaining: rest,
};
}
loop {
// Special case ";
let special = Html::special_parse(basic, "script");
assert_eq!(special.unwrap().0, "words words\n");
assert!(special.unwrap().1.is_empty());
}
#[test]
fn special_parse_correctly_ignore_non_start() {
let nonstart = "first_line\nlet end = '';\n";
let special = Html::special_parse(nonstart, "script");
assert!(special.is_none());
}
#[test]
fn special_parse_correctly_handles_leading_whitespace() {
let white = "words words\n \t\t";
let special = Html::special_parse(white, "script");
assert_eq!(special.unwrap().0, "words words\n \t\t");
}
#[test]
fn parse_node_parses_comment() {
let cmt = "";
let node = Html::parse_node(cmt);
assert_eq!(node.node, comment!(" Comment! "));
}
#[test]
fn parse_node_parses_tag() {
let basic = "Hello!
";
let hh = Html::parse_node(basic);
assert_eq!(hh.node, tag!("p", [text!("Hello!")]))
}
#[test]
fn parse_node_parses_nested_tags() {
let nested = "Hello!
";
let hh = Html::parse_node(nested);
assert_eq!(hh.node, tag!("p", [tag!("p", [text!("Hello!")])]))
}
#[test]
fn parse_multiple_toplevel() {
let nested = "Hello
World!
";
let hh = Html::parse(nested);
assert_eq!(
hh.nodes,
vec![tag!("p", [text!("Hello ")]), tag!("p", [text!("World!")])]
)
}
#[test]
fn parse_script() {
let raw = "\n\t\n";
let hh = Html::parse(raw);
assert_eq!(
hh.nodes,
vec![tag!(
"head",
[
text!("\n\t"),
tag!("script", [text!("let k=\"v\";\n\t")]),
text!("\n")
]
)]
)
}
#[test]
fn parse_external_script() {
let raw = "\n\t\n";
let hh = Html::parse(raw);
assert_eq!(
hh.nodes,
vec![tag!(
"head",
[
text!("\n\t"),
tag!("script", "src=\"script.js\""),
text!("\n")
]
)]
)
}
fn test_roundtrip(raw: &str) {
let html = Html::parse(raw);
let string = html.to_string();
for (raw, html) in raw.lines().zip(string.lines()) {
assert_eq!(raw, html)
}
}
#[test]
fn round_trip_simple() {
test_roundtrip("Hello!
")
}
#[test]
fn round_trip_complex() {
test_roundtrip(
r#"
Title!
Hello, World!
"#,
)
}
}