use crate::convert::IntoAttributeValue;
use crate::error::{Error, Result};
use crate::namespaces::NSChoice;
use crate::node::Node;
use crate::prefixes::{Namespace, Prefix, Prefixes};
use crate::tree_builder::TreeBuilder;
use alloc::borrow::Cow;
use alloc::string::String;
use alloc::vec::Vec;
use core::slice;
use core::str::FromStr;
use std::borrow::Borrow;
use std::hash::Hash;
use std::io;
use rxml::writer::{Encoder, Item, TrackNamespace};
use rxml::{AttrMap, Namespace as RxmlNamespace, NcName, RawReader, XmlVersion};
fn encode_and_write<W: io::Write, T: rxml::writer::TrackNamespace>(
item: Item<'_>,
enc: &mut Encoder<T>,
mut w: W,
) -> io::Result<()> {
let mut buf = rxml::bytes::BytesMut::new();
enc.encode_into_bytes(item, &mut buf)
.expect("encoder driven incorrectly");
w.write_all(&buf[..])?;
Ok(())
}
pub struct CustomItemWriter<W, T> {
writer: W,
encoder: Encoder<T>,
}
impl<W: io::Write> CustomItemWriter<W, rxml::writer::SimpleNamespaces> {
pub(crate) fn new(writer: W) -> Self {
Self {
writer,
encoder: Encoder::new(),
}
}
}
impl<W: io::Write, T: rxml::writer::TrackNamespace> CustomItemWriter<W, T> {
pub(crate) fn write(&mut self, item: Item<'_>) -> io::Result<()> {
encode_and_write(item, &mut self.encoder, &mut self.writer)
}
}
pub type ItemWriter<W> = CustomItemWriter<W, rxml::writer::SimpleNamespaces>;
#[must_use]
pub fn escape(raw: &[u8]) -> Cow<'_, [u8]> {
fn to_escape(b: u8) -> bool {
matches!(b, b'<' | b'>' | b'\'' | b'&' | b'"')
}
let mut escapes: Vec<(usize, &'static [u8])> = Vec::new();
let mut bytes = raw.iter();
let mut loc = 0;
while let Some(i) = bytes.position(|&b| to_escape(b)) {
loc += i;
match raw[loc] {
b'<' => escapes.push((loc, b"<")),
b'>' => escapes.push((loc, b">")),
b'\'' => escapes.push((loc, b"'")),
b'&' => escapes.push((loc, b"&")),
b'"' => escapes.push((loc, b""")),
_ => unreachable!("Only '<', '>', '\'', '&' and '\"' are escaped"),
}
loc += 1;
}
if escapes.is_empty() {
Cow::Borrowed(raw)
} else {
let len = raw.len();
let mut v = Vec::with_capacity(len);
let mut start = 0;
for (i, r) in escapes {
v.extend_from_slice(&raw[start..i]);
v.extend_from_slice(r);
start = i + 1;
}
if start < len {
v.extend_from_slice(&raw[start..]);
}
Cow::Owned(v)
}
}
#[derive(Clone, Eq, Debug)]
pub struct Element {
name: String,
namespace: String,
pub prefixes: Prefixes,
attributes: AttrMap,
children: Vec<Node>,
}
impl<'a> From<&'a Element> for String {
fn from(elem: &'a Element) -> String {
let mut writer = Vec::new();
elem.write_to(&mut writer).unwrap();
String::from_utf8(writer).unwrap()
}
}
impl FromStr for Element {
type Err = Error;
fn from_str(s: &str) -> Result<Element> {
Element::from_reader(s.as_bytes())
}
}
impl PartialEq for Element {
fn eq(&self, other: &Self) -> bool {
if self.name() == other.name() && self.ns() == other.ns() && self.attrs().eq(other.attrs())
{
if self.nodes().count() != other.nodes().count() {
return false;
}
self.nodes()
.zip(other.nodes())
.all(|(node1, node2)| node1 == node2)
} else {
false
}
}
}
impl Element {
pub(crate) fn new<P: Into<Prefixes>>(
name: String,
namespace: String,
prefixes: P,
attributes: AttrMap,
children: Vec<Node>,
) -> Element {
Element {
name,
namespace,
prefixes: prefixes.into(),
attributes,
children,
}
}
pub fn builder<S: AsRef<str>, NS: Into<String>>(name: S, namespace: NS) -> ElementBuilder {
ElementBuilder {
root: Element::new(
name.as_ref().to_string(),
namespace.into(),
None,
AttrMap::new(),
Vec::new(),
),
}
}
pub fn bare<S: Into<String>, NS: Into<String>>(name: S, namespace: NS) -> Element {
Element::new(
name.into(),
namespace.into(),
None,
AttrMap::new(),
Vec::new(),
)
}
#[must_use]
pub fn name(&self) -> &str {
&self.name
}
#[must_use]
pub fn ns(&self) -> String {
self.namespace.clone()
}
#[must_use]
pub fn attr<'a, N: Ord + Hash + Eq + ?Sized>(&'a self, name: &'a N) -> Option<&'a str>
where
NcName: Borrow<N>,
{
if let Some(value) = self.attributes.get(&RxmlNamespace::NONE, name) {
return Some(value);
}
None
}
#[must_use]
pub fn attr_ns<'a, NS: Ord + Hash + Eq + ?Sized, N: Ord + Hash + Eq + ?Sized>(
&'a self,
ns: &'a NS,
name: &'a N,
) -> Option<&'a str>
where
RxmlNamespace: Borrow<NS>,
NcName: Borrow<N>,
{
if let Some(value) = self.attributes.get(ns, name) {
return Some(value);
}
None
}
#[must_use]
pub fn attrs(&self) -> &AttrMap {
&self.attributes
}
#[must_use]
pub fn attrs_mut(&mut self) -> &mut AttrMap {
&mut self.attributes
}
pub fn set_attr<V: IntoAttributeValue>(&mut self, ns: RxmlNamespace, name: NcName, val: V) {
let val = val.into_attribute_value();
if let Some(value) = self.attributes.get_mut(&ns, &name) {
*value = val
.expect("removing existing value via set_attr, this is not yet supported (TODO)"); return;
}
if let Some(val) = val {
self.attributes.insert(ns.clone(), name, val);
}
}
pub fn is<'a, N: AsRef<str>, NS: Into<NSChoice<'a>>>(&self, name: N, namespace: NS) -> bool {
self.name == name.as_ref() && namespace.into().compare(self.namespace.as_ref())
}
pub fn has_ns<'a, NS: Into<NSChoice<'a>>>(&self, namespace: NS) -> bool {
namespace.into().compare(self.namespace.as_ref())
}
fn from_reader_inner<R: io::BufRead>(
mut tree_builder: TreeBuilder,
reader: R,
) -> Result<Element> {
let mut driver = RawReader::new(reader);
while let Some(event) = driver.read()? {
tree_builder.process_event(event)?;
if let Some(root) = tree_builder.root.take() {
return Ok(root);
}
}
Err(Error::EndOfDocument)
}
pub fn from_reader<R: io::BufRead>(reader: R) -> Result<Element> {
Element::from_reader_inner(TreeBuilder::new(), reader)
}
pub fn from_reader_with_prefixes<R: io::BufRead, P: Into<Prefixes>>(
reader: R,
prefixes: P,
) -> Result<Element> {
let tree_builder = TreeBuilder::new().with_prefixes_stack([prefixes.into()].into());
Element::from_reader_inner(tree_builder, reader)
}
pub fn write_to<W: io::Write>(&self, writer: &mut W) -> Result<()> {
self.to_writer(&mut ItemWriter::new(writer))
}
pub fn write_to_decl<W: io::Write>(&self, writer: &mut W) -> Result<()> {
self.to_writer_decl(&mut ItemWriter::new(writer))
}
pub fn to_writer<W: io::Write>(&self, writer: &mut ItemWriter<W>) -> Result<()> {
self.write_to_inner(writer)
}
pub fn to_writer_decl<W: io::Write>(&self, writer: &mut ItemWriter<W>) -> Result<()> {
writer
.write(Item::XmlDeclaration(XmlVersion::V1_0))
.unwrap(); self.write_to_inner(writer)
}
pub fn write_to_inner<W: io::Write>(&self, writer: &mut ItemWriter<W>) -> Result<()> {
for (prefix, namespace) in self.prefixes.declared_prefixes() {
assert!(writer.encoder.ns_tracker_mut().declare_fixed(
prefix.as_deref().map(TryInto::try_into).transpose()?,
namespace.clone().into(),
));
}
let namespace: RxmlNamespace = self.namespace.clone().into();
writer.write(Item::ElementHeadStart(&namespace, (*self.name).try_into()?))?;
for ((ns, key), value) in &self.attributes {
writer.write(Item::Attribute(&ns, key, value))?;
}
if !self.children.is_empty() {
writer.write(Item::ElementHeadEnd)?;
for child in &self.children {
child.write_to_inner(writer)?;
}
}
writer.write(Item::ElementFoot)?;
Ok(())
}
pub fn take_nodes(&mut self) -> Vec<Node> {
self.children.drain(..).collect()
}
#[inline]
pub fn nodes(&self) -> Nodes<'_> {
self.children.iter()
}
#[inline]
pub fn nodes_mut(&mut self) -> NodesMut<'_> {
self.children.iter_mut()
}
#[inline]
#[must_use]
pub fn children(&self) -> Children<'_> {
Children {
iter: self.children.iter(),
}
}
#[inline]
#[must_use]
pub fn children_mut(&mut self) -> ChildrenMut<'_> {
ChildrenMut {
iter: self.children.iter_mut(),
}
}
#[inline]
#[doc(hidden)]
pub fn take_contents_as_children(&mut self) -> ContentsAsChildren<'_> {
ContentsAsChildren {
iter: self.children.drain(..),
}
}
#[inline]
#[must_use]
pub fn texts(&self) -> Texts<'_> {
Texts {
iter: self.children.iter(),
}
}
#[inline]
#[must_use]
pub fn texts_mut(&mut self) -> TextsMut<'_> {
TextsMut {
iter: self.children.iter_mut(),
}
}
pub fn append_child(&mut self, child: Element) -> &mut Element {
self.children.push(Node::Element(child));
if let Node::Element(ref mut cld) = *self.children.last_mut().unwrap() {
cld
} else {
unreachable!()
}
}
pub fn append_text_node<S: Into<String>>(&mut self, child: S) {
self.children.push(Node::Text(child.into()));
}
pub fn append_text<S: Into<String>>(&mut self, text: S) {
if let Some(Node::Text(ref mut child)) = self.children.last_mut() {
child.push_str(&text.into());
} else {
self.append_text_node(text);
}
}
pub fn append_node(&mut self, node: Node) {
self.children.push(node);
}
#[must_use]
pub fn text(&self) -> String {
self.texts().fold(String::new(), |ret, new| ret + new)
}
pub fn get_child<'a, N: AsRef<str>, NS: Into<NSChoice<'a>>>(
&self,
name: N,
namespace: NS,
) -> Option<&Element> {
let namespace = namespace.into();
for fork in &self.children {
if let Node::Element(ref e) = *fork {
if e.is(name.as_ref(), namespace) {
return Some(e);
}
}
}
None
}
pub fn get_child_mut<'a, N: AsRef<str>, NS: Into<NSChoice<'a>>>(
&mut self,
name: N,
namespace: NS,
) -> Option<&mut Element> {
let namespace = namespace.into();
for fork in &mut self.children {
if let Node::Element(ref mut e) = *fork {
if e.is(name.as_ref(), namespace) {
return Some(e);
}
}
}
None
}
pub fn has_child<'a, N: AsRef<str>, NS: Into<NSChoice<'a>>>(
&self,
name: N,
namespace: NS,
) -> bool {
self.get_child(name, namespace).is_some()
}
pub fn remove_child<'a, N: AsRef<str>, NS: Into<NSChoice<'a>>>(
&mut self,
name: N,
namespace: NS,
) -> Option<Element> {
let name = name.as_ref();
let namespace = namespace.into();
let idx = self.children.iter().position(|x| {
if let Node::Element(ref elm) = x {
elm.is(name, namespace)
} else {
false
}
})?;
self.children.remove(idx).into_element()
}
pub fn unshift_child(&mut self) -> Option<Element> {
while !self.children.is_empty() {
if let Some(el) = self.children.remove(0).into_element() {
return Some(el);
}
}
None
}
}
pub struct Children<'a> {
iter: slice::Iter<'a, Node>,
}
impl<'a> Iterator for Children<'a> {
type Item = &'a Element;
fn next(&mut self) -> Option<&'a Element> {
for item in &mut self.iter {
if let Node::Element(ref child) = *item {
return Some(child);
}
}
None
}
}
pub struct ChildrenMut<'a> {
iter: slice::IterMut<'a, Node>,
}
impl<'a> Iterator for ChildrenMut<'a> {
type Item = &'a mut Element;
fn next(&mut self) -> Option<&'a mut Element> {
for item in &mut self.iter {
if let Node::Element(ref mut child) = *item {
return Some(child);
}
}
None
}
}
pub struct ContentsAsChildren<'a> {
iter: alloc::vec::Drain<'a, Node>,
}
impl Iterator for ContentsAsChildren<'_> {
type Item = Element;
fn next(&mut self) -> Option<Element> {
for item in &mut self.iter {
if let Node::Element(child) = item {
return Some(child);
}
}
None
}
}
pub struct Texts<'a> {
iter: slice::Iter<'a, Node>,
}
impl<'a> Iterator for Texts<'a> {
type Item = &'a str;
fn next(&mut self) -> Option<&'a str> {
for item in &mut self.iter {
if let Node::Text(ref child) = *item {
return Some(child);
}
}
None
}
}
pub struct TextsMut<'a> {
iter: slice::IterMut<'a, Node>,
}
impl<'a> Iterator for TextsMut<'a> {
type Item = &'a mut String;
fn next(&mut self) -> Option<&'a mut String> {
for item in &mut self.iter {
if let Node::Text(ref mut child) = *item {
return Some(child);
}
}
None
}
}
pub type Nodes<'a> = slice::Iter<'a, Node>;
pub type NodesMut<'a> = slice::IterMut<'a, Node>;
pub struct ElementBuilder {
root: Element,
}
impl ElementBuilder {
pub fn prefix<S: Into<Namespace>>(
mut self,
prefix: Prefix,
namespace: S,
) -> Result<ElementBuilder> {
if self.root.prefixes.get(&prefix).is_some() {
return Err(Error::DuplicatePrefix);
}
self.root.prefixes.insert(prefix, namespace.into());
Ok(self)
}
#[must_use]
pub fn attr<V: IntoAttributeValue>(mut self, name: NcName, value: V) -> ElementBuilder {
self.root.set_attr(RxmlNamespace::NONE, name, value);
self
}
#[must_use]
pub fn attr_ns<V: IntoAttributeValue>(
mut self,
ns: RxmlNamespace,
name: NcName,
value: V,
) -> ElementBuilder {
self.root.set_attr(ns, name, value);
self
}
#[must_use]
pub fn append<T: Into<Node>>(mut self, node: T) -> ElementBuilder {
self.root.append_node(node.into());
self
}
#[must_use]
pub fn append_all<T: Into<Node>, I: IntoIterator<Item = T>>(
mut self,
iter: I,
) -> ElementBuilder {
for node in iter {
self.root.append_node(node.into());
}
self
}
#[must_use]
pub fn build(self) -> Element {
self.root
}
}
#[cfg(test)]
mod tests {
use super::*;
use rxml::xml_ncname;
use std::collections::BTreeMap;
#[test]
fn test_element_new() {
let mut attrs = AttrMap::new();
attrs.insert(
String::from("namespace").into(),
xml_ncname!("name").to_owned(),
"value".to_string(),
);
let elem = Element::new(
"name".to_owned(),
"namespace".to_owned(),
(None, "namespace".to_owned()),
attrs,
Vec::new(),
);
assert_eq!(elem.name(), "name");
assert_eq!(elem.ns(), "namespace".to_owned());
assert_eq!(elem.attr_ns("namespace", "name"), Some("value"));
assert_eq!(elem.attr("inexistent"), None);
}
#[test]
fn test_from_reader_simple() {
let xml = b"<foo xmlns='ns1'></foo>";
let elem = Element::from_reader(&xml[..]);
let elem2 = Element::builder("foo", "ns1").build();
assert_eq!(elem.unwrap(), elem2);
}
#[test]
fn test_from_reader_nested() {
let xml = b"<foo xmlns='ns1'><bar xmlns='ns1' baz='qxx' /></foo>";
let elem = Element::from_reader(&xml[..]);
let nested = Element::builder("bar", "ns1")
.attr(xml_ncname!("baz").to_owned(), "qxx")
.build();
let elem2 = Element::builder("foo", "ns1").append(nested).build();
assert_eq!(elem.unwrap(), elem2);
}
#[test]
fn test_from_reader_with_prefix() {
let xml = b"<foo xmlns='ns1'><prefix:bar xmlns:prefix='ns1' baz='qxx' /></foo>";
let elem = Element::from_reader(&xml[..]);
let nested = Element::builder("bar", "ns1")
.attr(xml_ncname!("baz").to_owned(), "qxx")
.build();
let elem2 = Element::builder("foo", "ns1").append(nested).build();
assert_eq!(elem.unwrap(), elem2);
}
#[test]
fn test_from_reader_split_prefix() {
let xml = b"<foo:bar xmlns:foo='ns1'/>";
let elem = Element::from_reader(&xml[..]).unwrap();
assert_eq!(elem.name(), String::from("bar"));
assert_eq!(elem.ns(), String::from("ns1"));
assert_eq!(
elem.prefixes.get(&Some(String::from("foo"))),
Some(&String::from("ns1"))
);
}
#[test]
fn parses_spectest_xml() {
let xml = br#"<rng:grammar xmlns:rng="http://relaxng.org/ns/structure/1.0">
<rng:name xmlns:rng="http://relaxng.org/ns/structure/1.0"></rng:name>
</rng:grammar>
"#;
let _ = Element::from_reader(&xml[..]).unwrap();
}
#[test]
fn does_not_unescape_cdata() {
let xml = b"<test xmlns='test'><![CDATA['>blah<blah>]]></test>";
let elem = Element::from_reader(&xml[..]).unwrap();
assert_eq!(elem.text(), "'>blah<blah>");
}
#[test]
fn test_compare_all_ns() {
let xml = b"<foo xmlns='foo' xmlns:bar='baz'><bar:meh xmlns:bar='baz' /></foo>";
let elem = Element::from_reader(&xml[..]).unwrap();
let elem2 = elem.clone();
let xml3 = b"<foo xmlns='foo'><bar:meh xmlns:bar='baz'/></foo>";
let elem3 = Element::from_reader(&xml3[..]).unwrap();
let xml4 = b"<prefix:foo xmlns:prefix='foo'><bar:meh xmlns:bar='baz'/></prefix:foo>";
let elem4 = Element::from_reader(&xml4[..]).unwrap();
assert_eq!(elem, elem2);
assert_eq!(elem, elem3);
assert_eq!(elem, elem4);
}
#[test]
fn test_compare_empty_children() {
let elem1 = Element::bare("p", "");
let elem2 = Element::builder("p", "")
.append(Node::Element(Element::bare("span", "")))
.build();
assert_ne!(elem1, elem2);
}
#[test]
fn test_from_reader_with_prefixes() {
let xml = b"<foo><bar xmlns='baz'/></foo>";
let elem =
Element::from_reader_with_prefixes(&xml[..], String::from("jabber:client")).unwrap();
let xml2 = b"<foo xmlns='jabber:client'><bar xmlns='baz'/></foo>";
let elem2 = Element::from_reader(&xml2[..]).unwrap();
assert_eq!(elem, elem2);
}
#[test]
fn test_from_reader_with_prefixes_serialization() {
let prefixes: BTreeMap<Option<String>, String> = {
let mut tmp = BTreeMap::new();
tmp.insert(None, String::from("foo"));
tmp.insert(Some(String::from("test")), String::from("bar"));
tmp
};
let input = r#"<foo test:attr="true"><bar/></foo>"#;
let output = r#"<foo xmlns='foo' xmlns:test='bar' test:attr='true'><bar/></foo>"#;
let elem = Element::from_reader_with_prefixes(input.as_ref(), prefixes).unwrap();
assert_eq!(String::from(&elem), output);
}
#[test]
fn failure_with_duplicate_namespace() {
let _: Element = r###"<?xml version="1.0" encoding="UTF-8"?>
<wsdl:definitions
xmlns:wsdl="http://schemas.xmlsoap.org/wsdl/"
xmlns:xsd="http://www.w3.org/2001/XMLSchema">
<wsdl:types>
<xsd:schema xmlns:xs="http://www.w3.org/2001/XMLSchema">
</xsd:schema>
</wsdl:types>
</wsdl:definitions>
"###
.parse()
.unwrap();
}
}