use crate::tree::{NodeData, NodeRef};
use html5ever::serialize::TraversalScope::*;
use html5ever::serialize::{serialize, Serialize, SerializeOpts, Serializer, TraversalScope};
use html5ever::QualName;
use std::fmt;
use std::fs::File;
use std::io;
use std::io::Write;
use std::path::Path;
impl Serialize for NodeRef {
    /// Feed this node to an html5ever `Serializer`.
    ///
    /// * Elements emit their start tag (with attributes) and their end tag only when
    ///   `traversal_scope` is `IncludeNode`; their children are emitted either way.
    ///   When the element has template contents, the children of the template root are
    ///   emitted in place of the element's own children.
    /// * Documents and document fragments emit only their children, whatever the scope.
    /// * Every other node kind emits nothing unless the scope is `IncludeNode`, in which
    ///   case it is passed to the matching `write_*` method of the serializer.
    ///
    /// Children are always serialized with `IncludeNode`.
    ///
    /// # Errors
    ///
    /// Returns the first I/O error reported by the serializer.
    fn serialize<S: Serializer>(
        &self,
        serializer: &mut S,
        traversal_scope: TraversalScope,
    ) -> io::Result<()> {
        // Decide once whether the node itself (not just its children) is to be written.
        let include_self = traversal_scope == IncludeNode;

        match self.data() {
            NodeData::Element(element) => {
                if include_self {
                    let attributes = element.attributes.borrow();
                    // Build the qualified names up front so the serializer can be handed
                    // references to them.
                    let mut qualified = Vec::new();
                    for (name, attr) in attributes.map.iter() {
                        let qual_name = QualName::new(
                            attr.prefix.clone(),
                            name.ns.clone(),
                            name.local.clone(),
                        );
                        qualified.push((qual_name, &attr.value));
                    }
                    serializer.start_elem(
                        element.name.clone(),
                        qualified.iter().map(|pair| (&pair.0, &**pair.1)),
                    )?;
                }

                let children = element
                    .template_contents
                    .as_ref()
                    .map_or_else(|| self.children(), |template_root| template_root.children());
                for child in children {
                    Serialize::serialize(&child, serializer, IncludeNode)?;
                }

                if include_self {
                    serializer.end_elem(element.name.clone())?;
                }
                Ok(())
            }
            NodeData::DocumentFragment | NodeData::Document(_) => {
                for child in self.children() {
                    Serialize::serialize(&child, serializer, IncludeNode)?;
                }
                Ok(())
            }
            // The remaining node kinds have no children, so there is nothing to write
            // when only children were requested.
            _ if !include_self => Ok(()),
            NodeData::Doctype(doctype) => serializer.write_doctype(&doctype.name),
            NodeData::Text(text) => serializer.write_text(&text.borrow()),
            NodeData::Comment(text) => serializer.write_comment(&text.borrow()),
            NodeData::ProcessingInstruction(contents) => {
                let borrowed = contents.borrow();
                let (target, data) = &*borrowed;
                serializer.write_processing_instruction(target, data)
            }
        }
    }
}
impl fmt::Display for NodeRef {
    /// Write the serialized form of this node to the formatter.
    ///
    /// The node is first serialized into an in-memory byte buffer. A serialization
    /// failure, or output that is not valid UTF-8, is reported as `fmt::Error`.
    #[inline]
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        let mut buffer = Vec::new();
        if self.serialize(&mut buffer).is_err() {
            return Err(fmt::Error);
        }
        match String::from_utf8(buffer) {
            Ok(markup) => f.write_str(&markup),
            Err(_) => Err(fmt::Error),
        }
    }
}
impl NodeRef {
    /// Serialize this node and its descendants to the given stream.
    ///
    /// The node itself is included in the output (`IncludeNode` traversal scope); all
    /// other serializer options are left at their defaults.
    ///
    /// # Errors
    ///
    /// Returns any I/O error raised while writing to `writer`.
    #[inline]
    pub fn serialize<W: Write>(&self, writer: &mut W) -> io::Result<()> {
        serialize(
            writer,
            self,
            SerializeOpts {
                traversal_scope: IncludeNode,
                ..Default::default()
            },
        )
    }

    /// Serialize this node and its descendants to a file at the given path.
    ///
    /// The file is opened with `File::create`, so an existing file at `path` is
    /// truncated.
    ///
    /// # Errors
    ///
    /// Returns an error if the file cannot be created, or if writing or flushing the
    /// serialized output fails.
    #[inline]
    pub fn serialize_to_file<P: AsRef<Path>>(&self, path: P) -> io::Result<()> {
        // Buffer the output so the serializer is not writing straight to the raw file.
        let mut writer = io::BufWriter::new(File::create(path)?);
        self.serialize(&mut writer)?;
        // Flush explicitly: dropping a `BufWriter` would silently discard a late write error.
        writer.flush()
    }
}
#[cfg(test)]
mod tests {
    use crate::parser::parse_html;
    use crate::traits::*;
    use tempfile::TempDir;

    /// A document written to disk and parsed back serializes to the same string.
    #[test]
    fn serialize_and_read_file() {
        let tempdir = TempDir::new().unwrap();
        let path = tempdir.path().join("temp.html");

        let html =
            r"<!DOCTYPE html><html><head><title>Title</title></head><body>Body</body></html>";
        let document = parse_html().one(html);
        // Fail right here with the real I/O error instead of ignoring it and hitting a
        // less helpful failure when the file is read back.
        document
            .serialize_to_file(&path)
            .expect("serializing the document to a temporary file should succeed");

        let document2 = parse_html().from_utf8().from_file(&path).unwrap();
        assert_eq!(document.to_string(), document2.to_string());
    }

    /// `to_string` on a single node yields the serialization of that node's subtree.
    #[test]
    fn to_string() {
        let html = r"<!DOCTYPE html>
<html>
<head>
<title>Test case</title>
</head>
<body>
<p class=foo>Foo
</body>
</html>";
        let document = parse_html().one(html);
        // NOTE(review): the index and the expected text below are tied to the exact
        // whitespace of the markup above; keep them in sync when editing either.
        assert_eq!(
            document
                .inclusive_descendants()
                .nth(11)
                .unwrap()
                .to_string(),
            "<p class=\"foo\">Foo\n \n</p>"
        );
    }

    /// Comments appear verbatim in the serialized output.
    #[test]
    fn serialize_comment() {
        let html = r"<div><!-- This is a comment --></div>";
        let document = parse_html().one(html);
        let output = document.to_string();
        assert!(output.contains("<!-- This is a comment -->"));
    }

    /// Text, comment and element children of one parent are all serialized.
    #[test]
    fn serialize_mixed_content() {
        let html = r"<div>Text<!-- comment --><span>more</span></div>";
        let document = parse_html().one(html);
        let output = document.to_string();
        assert!(output.contains("Text"));
        assert!(output.contains("<!-- comment -->"));
        assert!(output.contains("<span>"));
    }

    /// Serializing a selected element into a byte buffer includes the element itself.
    #[test]
    fn serialize_to_writer() {
        let html = r"<p>Hello</p>";
        let document = parse_html().one(html);
        let p = document.select_first("p").unwrap();
        let mut buffer = Vec::new();
        p.as_node().serialize(&mut buffer).unwrap();
        let output = String::from_utf8(buffer).unwrap();
        assert_eq!(output, "<p>Hello</p>");
    }
}