xrust 2.0.3

Support for XPath and XSLT
Documentation
use crate::item::Node;
use crate::parser::combinators::alt::alt2;
use crate::parser::combinators::map::map;
use crate::parser::combinators::opt::opt;
use crate::parser::combinators::tag::tag;
use crate::parser::combinators::take::{take_one, take_while};
use crate::parser::combinators::tuple::{tuple2, tuple3, tuple5, tuple6, tuple8};
use crate::parser::combinators::wellformed::wellformed;
use crate::parser::combinators::whitespace::{whitespace0, whitespace1};
use crate::parser::xml::strings::delimited_string;
use crate::parser::{ParseError, ParseInput, StaticState};
use crate::xmldecl::XMLDecl;
use qualname::{NamespacePrefix, NamespaceUri};

fn xmldeclversion<'a, N: Node, L>()
-> impl Fn(ParseInput<'a, N>, &mut StaticState<L>) -> Result<(ParseInput<'a, N>, String), ParseError>
where
    L: FnMut(&NamespacePrefix) -> Result<NamespaceUri, ParseError>,
{
    move |input, ss| match tuple5(
        tag("version"),
        whitespace0(),
        tag("="),
        whitespace0(),
        delimited_string(),
    )(input, ss)
    {
        Ok((input1, (_, _, _, _, v))) => {
            if v.parse::<f64>().is_ok() {
                if v == *"1.1" {
                    Ok((input1, v))
                } else if v.starts_with("1.") {
                    Ok((input1, "1.0".to_string()))
                } else {
                    Err(ParseError::Notimplemented)
                }
            } else {
                Err(ParseError::NotWellFormed(format!(
                    "invalid XML version \"{}\"",
                    v
                )))
            }
        }
        Err(err) => Err(err),
    }
}

fn xmldeclstandalone<'a, N: Node, L>()
-> impl Fn(ParseInput<'a, N>, &mut StaticState<L>) -> Result<(ParseInput<'a, N>, String), ParseError>
where
    L: FnMut(&NamespacePrefix) -> Result<NamespaceUri, ParseError>,
{
    move |(input, state), ss| match map(
        wellformed(
            tuple6(
                whitespace1(),
                tag("standalone"),
                whitespace0(),
                tag("="),
                whitespace0(),
                delimited_string(),
            ),
            |(_, _, _, _, _, s)| ["yes".to_string(), "no".to_string()].contains(s),
            "invalid standalone value",
        ),
        |(_, _, _, _, _, s)| s,
    )((input, state), ss)
    {
        Err(e) => Err(e),
        Ok(((input2, mut state2), sta)) => {
            if &sta == "yes" {
                state2.standalone = true;
            }
            Ok(((input2, state2), sta))
        }
    }
}

pub(crate) fn encodingdecl<'a, N: Node, L>()
-> impl Fn(ParseInput<'a, N>, &mut StaticState<L>) -> Result<(ParseInput<'a, N>, String), ParseError>
where
    L: FnMut(&NamespacePrefix) -> Result<NamespaceUri, ParseError>,
{
    map(
        tuple6(
            whitespace1(),
            tag("encoding"),
            whitespace0(),
            tag("="),
            whitespace0(),
            //delimited_string(),
            alt2(
                tuple3(
                    tag("'"),
                    map(
                        tuple2(
                            wellformed(
                                take_one(),
                                |c| is_encname_startchar(*c),
                                "invalid character in XML encoding",
                            ),
                            take_while(is_encname_char),
                        ),
                        |(s, r)| [s.to_string(), r].concat(),
                    ),
                    tag("'"),
                ),
                tuple3(
                    tag("\""),
                    map(
                        tuple2(
                            wellformed(
                                take_one(),
                                |c| is_encname_startchar(*c),
                                "invalid character in XML encoding",
                            ),
                            take_while(is_encname_char),
                        ),
                        |(s, r)| [s.to_string(), r].concat(),
                    ),
                    tag("\""),
                ),
            ),
        ),
        |(_, _, _, _, _, (_, e, _))| e,
    )
}

pub(crate) fn xmldecl<'a, N: Node, L>()
-> impl Fn(ParseInput<'a, N>, &mut StaticState<L>) -> Result<(ParseInput<'a, N>, XMLDecl), ParseError>
where
    L: FnMut(&NamespacePrefix) -> Result<NamespaceUri, ParseError>,
{
    move |(input, state), ss| match tuple8(
        tag("<?xml"),
        whitespace1(),
        xmldeclversion(),
        opt(encodingdecl()),
        opt(xmldeclstandalone()),
        whitespace0(),
        tag("?>"),
        whitespace0(),
    )((input, state), ss)
    {
        Ok(((input1, mut state1), (_, _, ver, enc, sta, _, _, _))) => {
            // XML 1.0 (fifth edition): an external entity must include the encoding in its text declaration
            if state1.currentlyexternal && enc.is_none() {
                return Err(ParseError::NotWellFormed(String::from(
                    "missing encoding - external entity",
                )));
            }

            state1.xmlversion.clone_from(&ver);
            let res = XMLDecl {
                version: ver,
                encoding: enc,
                standalone: sta,
            };
            Ok(((input1, state1), res))
        }
        Err(e) => Err(e),
    }
}

pub(crate) fn is_encname_char(ch: char) -> bool {
    matches!(ch,
          'a'..='z'
        | 'A'..='Z'
        | '0'..='9'
        | '-'
        | '_'
        | '.'
    )
}

pub(crate) fn is_encname_startchar(ch: char) -> bool {
    ch.is_ascii_alphabetic()
}