use std::borrow::Cow;
use std::io::Write;
use std::result::Result as StdResult;
use crate::encoding::UTF8_BOM;
use crate::errors::{Error, Result};
use crate::events::{attributes::Attribute, BytesCData, BytesStart, BytesText, Event};
#[cfg(feature = "async-tokio")]
mod async_tokio;
#[cfg(feature = "serialize")]
use {crate::de::DeError, serde::Serialize};
#[derive(Clone)]
pub struct Writer<W> {
writer: W,
indent: Option<Indentation>,
}
impl<W> Writer<W> {
pub fn new(inner: W) -> Writer<W> {
Writer {
writer: inner,
indent: None,
}
}
pub fn new_with_indent(inner: W, indent_char: u8, indent_size: usize) -> Writer<W> {
Writer {
writer: inner,
indent: Some(Indentation::new(indent_char, indent_size)),
}
}
pub fn into_inner(self) -> W {
self.writer
}
pub fn get_mut(&mut self) -> &mut W {
&mut self.writer
}
pub fn get_ref(&self) -> &W {
&self.writer
}
#[must_use]
pub fn create_element<'a, N>(&'a mut self, name: N) -> ElementWriter<W>
where
N: Into<Cow<'a, str>>,
{
ElementWriter {
writer: self,
start_tag: BytesStart::new(name),
state: AttributeIndent::NoneAttributesWritten,
spaces: Vec::new(),
}
}
}
impl<W: Write> Writer<W> {
pub fn write_bom(&mut self) -> Result<()> {
self.write(UTF8_BOM)
}
pub fn write_event<'a, E: AsRef<Event<'a>>>(&mut self, event: E) -> Result<()> {
let mut next_should_line_break = true;
let result = match *event.as_ref() {
Event::Start(ref e) => {
let result = self.write_wrapped(b"<", e, b">");
if let Some(i) = self.indent.as_mut() {
i.grow();
}
result
}
Event::End(ref e) => {
if let Some(i) = self.indent.as_mut() {
i.shrink();
}
self.write_wrapped(b"</", e, b">")
}
Event::Empty(ref e) => self.write_wrapped(b"<", e, b"/>"),
Event::Text(ref e) => {
next_should_line_break = false;
self.write(e)
}
Event::Comment(ref e) => self.write_wrapped(b"<!--", e, b"-->"),
Event::CData(ref e) => {
next_should_line_break = false;
self.write(b"<![CDATA[")?;
self.write(e)?;
self.write(b"]]>")
}
Event::Decl(ref e) => self.write_wrapped(b"<?", e, b"?>"),
Event::PI(ref e) => self.write_wrapped(b"<?", e, b"?>"),
Event::DocType(ref e) => self.write_wrapped(b"<!DOCTYPE ", e, b">"),
Event::Eof => Ok(()),
};
if let Some(i) = self.indent.as_mut() {
i.should_line_break = next_should_line_break;
}
result
}
#[inline]
pub(crate) fn write(&mut self, value: &[u8]) -> Result<()> {
self.writer.write_all(value).map_err(Into::into)
}
#[inline]
fn write_wrapped(&mut self, before: &[u8], value: &[u8], after: &[u8]) -> Result<()> {
if let Some(ref i) = self.indent {
if i.should_line_break {
self.writer.write_all(b"\n")?;
self.writer.write_all(i.current())?;
}
}
self.write(before)?;
self.write(value)?;
self.write(after)?;
Ok(())
}
pub fn write_indent(&mut self) -> Result<()> {
if let Some(ref i) = self.indent {
self.writer.write_all(b"\n")?;
self.writer.write_all(i.current())?;
}
Ok(())
}
#[cfg(feature = "serialize")]
pub fn write_serializable<T: Serialize>(
&mut self,
tag_name: &str,
content: &T,
) -> std::result::Result<(), DeError> {
use crate::se::{Indent, Serializer};
self.write_indent()?;
let mut fmt = ToFmtWrite(&mut self.writer);
let mut serializer = Serializer::with_root(&mut fmt, Some(tag_name))?;
if let Some(indent) = &mut self.indent {
serializer.set_indent(Indent::Borrow(indent));
}
content.serialize(serializer)?;
Ok(())
}
}
#[derive(Debug)]
enum AttributeIndent {
NoneAttributesWritten,
WriteSpaces(usize),
Spaces(usize),
WriteConfigured(usize),
Configured(usize),
}
pub struct ElementWriter<'a, W> {
writer: &'a mut Writer<W>,
start_tag: BytesStart<'a>,
state: AttributeIndent,
spaces: Vec<u8>,
}
impl<'a, W> ElementWriter<'a, W> {
pub fn with_attribute<'b, I>(mut self, attr: I) -> Self
where
I: Into<Attribute<'b>>,
{
self.write_attr(attr.into());
self
}
pub fn with_attributes<'b, I>(mut self, attributes: I) -> Self
where
I: IntoIterator,
I::Item: Into<Attribute<'b>>,
{
let mut iter = attributes.into_iter();
if let Some(attr) = iter.next() {
self.write_attr(attr.into());
self.start_tag.extend_attributes(iter);
}
self
}
pub fn new_line(mut self) -> Self {
if let Some(i) = self.writer.indent.as_mut() {
match self.state {
AttributeIndent::NoneAttributesWritten => {
self.state = AttributeIndent::WriteConfigured(i.indent_size)
}
AttributeIndent::WriteSpaces(_) => {}
AttributeIndent::Spaces(indent) => {
self.state = AttributeIndent::WriteSpaces(indent)
}
AttributeIndent::WriteConfigured(_) => {}
AttributeIndent::Configured(indent) => {
self.state = AttributeIndent::WriteConfigured(indent)
}
}
self.start_tag.push_newline();
};
self
}
fn write_attr<'b>(&mut self, attr: Attribute<'b>) {
if let Some(i) = self.writer.indent.as_mut() {
self.state = match self.state {
AttributeIndent::NoneAttributesWritten => {
self.start_tag.push_attribute(attr);
AttributeIndent::Spaces(self.start_tag.name().as_ref().len() + 2)
}
AttributeIndent::WriteSpaces(indent) => {
if self.spaces.len() < indent {
self.spaces.resize(indent, b' ');
}
self.start_tag.push_indent(&self.spaces[..indent]);
self.start_tag.push_attr(attr.into());
AttributeIndent::Spaces(indent)
}
AttributeIndent::Spaces(indent) => {
self.start_tag.push_attribute(attr);
AttributeIndent::Spaces(indent)
}
AttributeIndent::WriteConfigured(indent) => {
self.start_tag.push_indent(i.additional(indent));
self.start_tag.push_attr(attr.into());
AttributeIndent::Configured(indent)
}
AttributeIndent::Configured(indent) => {
self.start_tag.push_attribute(attr);
AttributeIndent::Configured(indent)
}
};
} else {
self.start_tag.push_attribute(attr);
}
}
}
impl<'a, W: Write> ElementWriter<'a, W> {
pub fn write_text_content(self, text: BytesText) -> Result<&'a mut Writer<W>> {
self.writer
.write_event(Event::Start(self.start_tag.borrow()))?;
self.writer.write_event(Event::Text(text))?;
self.writer
.write_event(Event::End(self.start_tag.to_end()))?;
Ok(self.writer)
}
pub fn write_cdata_content(self, text: BytesCData) -> Result<&'a mut Writer<W>> {
self.writer
.write_event(Event::Start(self.start_tag.borrow()))?;
self.writer.write_event(Event::CData(text))?;
self.writer
.write_event(Event::End(self.start_tag.to_end()))?;
Ok(self.writer)
}
pub fn write_pi_content(self, text: BytesText) -> Result<&'a mut Writer<W>> {
self.writer
.write_event(Event::Start(self.start_tag.borrow()))?;
self.writer.write_event(Event::PI(text))?;
self.writer
.write_event(Event::End(self.start_tag.to_end()))?;
Ok(self.writer)
}
pub fn write_empty(self) -> Result<&'a mut Writer<W>> {
self.writer.write_event(Event::Empty(self.start_tag))?;
Ok(self.writer)
}
pub fn write_inner_content<F, E>(self, closure: F) -> StdResult<&'a mut Writer<W>, E>
where
F: FnOnce(&mut Writer<W>) -> StdResult<(), E>,
E: From<Error>,
{
self.writer
.write_event(Event::Start(self.start_tag.borrow()))?;
closure(self.writer)?;
self.writer
.write_event(Event::End(self.start_tag.to_end()))?;
Ok(self.writer)
}
}
#[cfg(feature = "serialize")]
struct ToFmtWrite<T>(pub T);
#[cfg(feature = "serialize")]
impl<T> std::fmt::Write for ToFmtWrite<T>
where
T: std::io::Write,
{
fn write_str(&mut self, s: &str) -> std::fmt::Result {
self.0.write_all(s.as_bytes()).map_err(|_| std::fmt::Error)
}
}
#[derive(Clone)]
pub(crate) struct Indentation {
should_line_break: bool,
indent_char: u8,
indent_size: usize,
indents: Vec<u8>,
current_indent_len: usize,
}
impl Indentation {
pub fn new(indent_char: u8, indent_size: usize) -> Self {
Self {
should_line_break: false,
indent_char,
indent_size,
indents: vec![indent_char; 128],
current_indent_len: 0, }
}
pub fn grow(&mut self) {
self.current_indent_len += self.indent_size;
self.ensure(self.current_indent_len);
}
pub fn shrink(&mut self) {
self.current_indent_len = self.current_indent_len.saturating_sub(self.indent_size);
}
pub fn current(&self) -> &[u8] {
&self.indents[..self.current_indent_len]
}
pub fn additional(&mut self, additional_indent: usize) -> &[u8] {
let new_len = self.current_indent_len + additional_indent;
self.ensure(new_len);
&self.indents[..new_len]
}
fn ensure(&mut self, new_len: usize) {
if self.indents.len() < new_len {
self.indents.resize(new_len, self.indent_char);
}
}
}
#[cfg(test)]
mod indentation {
use super::*;
use crate::events::*;
use pretty_assertions::assert_eq;
#[test]
fn self_closed() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b' ', 4);
let tag = BytesStart::new("self-closed")
.with_attributes(vec![("attr1", "value1"), ("attr2", "value2")].into_iter());
writer
.write_event(Event::Empty(tag))
.expect("write tag failed");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
r#"<self-closed attr1="value1" attr2="value2"/>"#
);
}
#[test]
fn empty_paired() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b' ', 4);
let start = BytesStart::new("paired")
.with_attributes(vec![("attr1", "value1"), ("attr2", "value2")].into_iter());
let end = start.to_end();
writer
.write_event(Event::Start(start.clone()))
.expect("write start tag failed");
writer
.write_event(Event::End(end))
.expect("write end tag failed");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
r#"<paired attr1="value1" attr2="value2">
</paired>"#
);
}
#[test]
fn paired_with_inner() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b' ', 4);
let start = BytesStart::new("paired")
.with_attributes(vec![("attr1", "value1"), ("attr2", "value2")].into_iter());
let end = start.to_end();
let inner = BytesStart::new("inner");
writer
.write_event(Event::Start(start.clone()))
.expect("write start tag failed");
writer
.write_event(Event::Empty(inner))
.expect("write inner tag failed");
writer
.write_event(Event::End(end))
.expect("write end tag failed");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
r#"<paired attr1="value1" attr2="value2">
<inner/>
</paired>"#
);
}
#[test]
fn paired_with_text() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b' ', 4);
let start = BytesStart::new("paired")
.with_attributes(vec![("attr1", "value1"), ("attr2", "value2")].into_iter());
let end = start.to_end();
let text = BytesText::new("text");
writer
.write_event(Event::Start(start.clone()))
.expect("write start tag failed");
writer
.write_event(Event::Text(text))
.expect("write text failed");
writer
.write_event(Event::End(end))
.expect("write end tag failed");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
r#"<paired attr1="value1" attr2="value2">text</paired>"#
);
}
#[test]
fn mixed_content() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b' ', 4);
let start = BytesStart::new("paired")
.with_attributes(vec![("attr1", "value1"), ("attr2", "value2")].into_iter());
let end = start.to_end();
let text = BytesText::new("text");
let inner = BytesStart::new("inner");
writer
.write_event(Event::Start(start.clone()))
.expect("write start tag failed");
writer
.write_event(Event::Text(text))
.expect("write text failed");
writer
.write_event(Event::Empty(inner))
.expect("write inner tag failed");
writer
.write_event(Event::End(end))
.expect("write end tag failed");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
r#"<paired attr1="value1" attr2="value2">text<inner/>
</paired>"#
);
}
#[test]
fn nested() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b' ', 4);
let start = BytesStart::new("paired")
.with_attributes(vec![("attr1", "value1"), ("attr2", "value2")].into_iter());
let end = start.to_end();
let inner = BytesStart::new("inner");
writer
.write_event(Event::Start(start.clone()))
.expect("write start 1 tag failed");
writer
.write_event(Event::Start(start.clone()))
.expect("write start 2 tag failed");
writer
.write_event(Event::Empty(inner))
.expect("write inner tag failed");
writer
.write_event(Event::End(end.clone()))
.expect("write end tag 2 failed");
writer
.write_event(Event::End(end))
.expect("write end tag 1 failed");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
r#"<paired attr1="value1" attr2="value2">
<paired attr1="value1" attr2="value2">
<inner/>
</paired>
</paired>"#
);
}
#[cfg(feature = "serialize")]
#[test]
fn serializable() {
#[derive(Serialize)]
struct Foo {
#[serde(rename = "@attribute")]
attribute: &'static str,
element: Bar,
list: Vec<&'static str>,
#[serde(rename = "$text")]
text: &'static str,
val: String,
}
#[derive(Serialize)]
struct Bar {
baz: usize,
bat: usize,
}
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b' ', 4);
let content = Foo {
attribute: "attribute",
element: Bar { baz: 42, bat: 43 },
list: vec!["first element", "second element"],
text: "text",
val: "foo".to_owned(),
};
let start = BytesStart::new("paired")
.with_attributes(vec![("attr1", "value1"), ("attr2", "value2")].into_iter());
let end = start.to_end();
writer
.write_event(Event::Start(start.clone()))
.expect("write start tag failed");
writer
.write_serializable("foo_element", &content)
.expect("write serializable inner contents failed");
writer
.write_event(Event::End(end))
.expect("write end tag failed");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
r#"<paired attr1="value1" attr2="value2">
<foo_element attribute="attribute">
<element>
<baz>42</baz>
<bat>43</bat>
</element>
<list>first element</list>
<list>second element</list>
text
<val>foo</val>
</foo_element>
</paired>"#
);
}
#[test]
fn element_writer_empty() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b' ', 4);
writer
.create_element("empty")
.with_attribute(("attr1", "value1"))
.with_attribute(("attr2", "value2"))
.write_empty()
.expect("failure");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
r#"<empty attr1="value1" attr2="value2"/>"#
);
}
#[test]
fn element_writer_text() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b' ', 4);
writer
.create_element("paired")
.with_attribute(("attr1", "value1"))
.with_attribute(("attr2", "value2"))
.write_text_content(BytesText::new("text"))
.expect("failure");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
r#"<paired attr1="value1" attr2="value2">text</paired>"#
);
}
#[test]
fn element_writer_nested() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b' ', 4);
writer
.create_element("outer")
.with_attribute(("attr1", "value1"))
.with_attribute(("attr2", "value2"))
.write_inner_content::<_, Error>(|writer| {
let fruits = ["apple", "orange", "banana"];
for (quant, item) in fruits.iter().enumerate() {
writer
.create_element("fruit")
.with_attribute(("quantity", quant.to_string().as_str()))
.write_text_content(BytesText::new(item))?;
}
writer
.create_element("inner")
.write_inner_content(|writer| {
writer.create_element("empty").write_empty().map(|_| ())
})?;
Ok(())
})
.expect("failure");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
r#"<outer attr1="value1" attr2="value2">
<fruit quantity="0">apple</fruit>
<fruit quantity="1">orange</fruit>
<fruit quantity="2">banana</fruit>
<inner>
<empty/>
</inner>
</outer>"#
);
}
mod in_attributes {
use super::*;
use pretty_assertions::assert_eq;
#[test]
fn newline_first() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b'_', 1);
writer
.create_element("element")
.new_line()
.with_attribute(("first", "1"))
.with_attribute(("second", "2"))
.new_line()
.with_attribute(("third", "3"))
.with_attribute(("fourth", "4"))
.write_empty()
.expect("write tag failed");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
"<element\
\n_first=\"1\" second=\"2\"\
\n_third=\"3\" fourth=\"4\"/>"
);
}
#[test]
fn newline_inside() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b'_', 1);
writer
.create_element("element")
.with_attribute(("first", "1"))
.with_attribute(("second", "2"))
.new_line()
.with_attribute(("third", "3"))
.with_attribute(("fourth", "4"))
.write_empty()
.expect("write tag failed");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
"<element first=\"1\" second=\"2\"\
\n third=\"3\" fourth=\"4\"/>"
);
}
#[test]
fn newline_last() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b'_', 1);
writer
.create_element("element")
.new_line()
.with_attribute(("first", "1"))
.with_attribute(("second", "2"))
.new_line()
.with_attribute(("third", "3"))
.with_attribute(("fourth", "4"))
.new_line()
.write_empty()
.expect("write tag failed");
writer
.create_element("element")
.with_attribute(("first", "1"))
.with_attribute(("second", "2"))
.new_line()
.with_attribute(("third", "3"))
.with_attribute(("fourth", "4"))
.new_line()
.write_empty()
.expect("write tag failed");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
"<element\
\n_first=\"1\" second=\"2\"\
\n_third=\"3\" fourth=\"4\"\
\n/>\
\n<element first=\"1\" second=\"2\"\
\n third=\"3\" fourth=\"4\"\
\n/>"
);
}
#[test]
fn newline_twice() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b'_', 1);
writer
.create_element("element")
.new_line()
.new_line()
.write_empty()
.expect("write tag failed");
writer
.create_element("element")
.with_attribute(("first", "1"))
.new_line()
.new_line()
.with_attribute(("second", "2"))
.write_empty()
.expect("write tag failed");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
r#"<element
/>
<element first="1"
second="2"/>"#
);
}
#[test]
fn without_indent() {
let mut buffer = Vec::new();
let mut writer = Writer::new(&mut buffer);
writer
.create_element("element")
.new_line()
.new_line()
.write_empty()
.expect("write tag failed");
writer
.create_element("element")
.with_attribute(("first", "1"))
.new_line()
.new_line()
.with_attribute(("second", "2"))
.write_empty()
.expect("write tag failed");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
r#"<element/><element first="1" second="2"/>"#
);
}
#[test]
fn long_element_name() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b't', 1);
writer
.create_element(String::from("x").repeat(128).as_str())
.with_attribute(("first", "1"))
.new_line()
.with_attribute(("second", "2"))
.write_empty()
.expect("Problem with indentation reference");
}
}
mod in_attributes_multi {
use super::*;
use pretty_assertions::assert_eq;
#[test]
fn newline_first() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b'_', 1);
writer
.create_element("element")
.new_line()
.with_attributes([("first", "1"), ("second", "2")])
.new_line()
.with_attributes([("third", "3"), ("fourth", "4")])
.write_empty()
.expect("write tag failed");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
"<element\
\n_first=\"1\" second=\"2\"\
\n_third=\"3\" fourth=\"4\"/>"
);
}
#[test]
fn newline_inside() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b'_', 1);
writer
.create_element("element")
.with_attributes([("first", "1"), ("second", "2")])
.new_line()
.with_attributes([("third", "3"), ("fourth", "4")])
.write_empty()
.expect("write tag failed");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
r#"<element first="1" second="2"
third="3" fourth="4"/>"#
);
}
#[test]
fn newline_last() {
let mut buffer = Vec::new();
let mut writer = Writer::new_with_indent(&mut buffer, b'_', 1);
writer
.create_element("element")
.new_line()
.with_attributes([("first", "1"), ("second", "2")])
.new_line()
.with_attributes([("third", "3"), ("fourth", "4")])
.new_line()
.write_empty()
.expect("write tag failed");
writer
.create_element("element")
.with_attributes([("first", "1"), ("second", "2")])
.new_line()
.with_attributes([("third", "3"), ("fourth", "4")])
.new_line()
.write_empty()
.expect("write tag failed");
assert_eq!(
std::str::from_utf8(&buffer).unwrap(),
"<element\
\n_first=\"1\" second=\"2\"\
\n_third=\"3\" fourth=\"4\"\
\n/>\
\n<element first=\"1\" second=\"2\"\
\n third=\"3\" fourth=\"4\"\
\n/>"
);
}
}
}