xrust 2.0.3

Support for XPath and XSLT
Documentation
use crate::item::Node;
use crate::parser::combinators::alt::{alt3, alt4};
use crate::parser::combinators::delimited::delimited;
use crate::parser::combinators::many::many0;
use crate::parser::combinators::map::map;
use crate::parser::combinators::tag::tag;
use crate::parser::combinators::take::{take_until, take_until_either_or_min1, take_until_end};
use crate::parser::combinators::tuple::{tuple2, tuple7};
use crate::parser::combinators::wellformed::{wellformed, wellformed_ver};
use crate::parser::combinators::whitespace::{whitespace0, whitespace1};
use crate::parser::common::{is_char10, is_char11, is_unrestricted_char11};
use crate::parser::xml::chardata::chardata_unicode_codepoint;
use crate::parser::xml::dtd::externalid::textexternalid;
use crate::parser::xml::dtd::intsubset::intsubset;
use crate::parser::xml::dtd::pereference::petextreference;
use crate::parser::xml::qname::qualname_to_parts;
use crate::parser::{ParseError, ParseInput, StaticState};
use qualname::{NamespacePrefix, NamespaceUri};

pub(crate) fn gedecl<'a, N: Node, L>()
-> impl Fn(ParseInput<'a, N>, &mut StaticState<L>) -> Result<(ParseInput<'a, N>, ()), ParseError>
where
    L: FnMut(&NamespacePrefix) -> Result<NamespaceUri, ParseError>,
{
    move |input, ss| match wellformed_ver(
        tuple7(
            tag("<!ENTITY"),
            whitespace1(),
            wellformed(
                qualname_to_parts(),
                |(p, _)| p.is_none(),
                "entity name has colon",
            ),
            whitespace1(),
            alt3(
                textexternalid(),
                delimited(tag("'"), take_until("'"), tag("'")),
                delimited(tag("\""), take_until("\""), tag("\"")),
            ),
            whitespace0(),
            tag(">"),
        ),
        |(_, _, _, _, s, _, _)| !s.contains(|c: char| !is_char10(&c)), //XML 1.0
        |(_, _, _, _, s, _, _)| !s.contains(|c: char| !is_unrestricted_char11(&c)), //XML 1.1
        "entity name has invalid characters",
    )(input, ss)
    {
        Ok(((input2, mut state2), (_, _, (_, l), _, s, _, _))) => {
            /*
            Numeric and other entities expanded immediately, since there'll be namespaces and the like to
            deal with later, after that we just store the entity as a string and parse again when called.
             */
            if !state2.currentlyexternal && s.contains('%') {
                return Err(ParseError::NotWellFormed(format!(
                    "cannot expand parameter entity \"{}\"",
                    s
                )));
            }

            let entityparse = map(
                tuple2(
                    map(
                        many0(alt4(
                            //we leave the &#13; or #xD; as is, as it will be converted later if needed and we don't want the \r character stripped later.
                            map(
                                wellformed_ver(
                                    chardata_unicode_codepoint(),
                                    is_char10,
                                    is_char11,
                                    "invalid Unicode codepoint",
                                ),
                                |c| {
                                    if c == '\r' {
                                        "&#13;".to_string()
                                    } else {
                                        c.to_string()
                                    }
                                },
                            ),
                            petextreference(),
                            //General entity is ignored.
                            map(delimited(tag("&"), take_until(";"), tag(";")), |s| {
                                ["&".to_string(), s, ";".to_string()].concat()
                            }),
                            take_until_either_or_min1("&", "%"),
                        )),
                        |ve| ve.concat(),
                    ),
                    wellformed(
                        take_until_end(),
                        |s| !s.contains('&') && !s.contains('%'),
                        "entity not allowed",
                    ),
                ),
                |(a, b)| [a, b].concat(),
            )((s.as_str(), state2.clone()), ss);

            match entityparse {
                Ok(((_, _), res)) => {
                    if !state2.currentlyexternal {
                        match intsubset()((res.as_str(), state2.clone()), ss) {
                            Ok(_) => {}
                            Err(_) => {
                                return Err(ParseError::NotWellFormed(format!(
                                    "unable to parse entity \"{}\"",
                                    res.clone()
                                )));
                            }
                        }
                    };

                    /* Entities should always bind to the first value */
                    let replaceable = state2.currentlyexternal;
                    match state2.dtd.generalentities.get(l.as_str()) {
                        None => {
                            state2.dtd.generalentities.insert(l, (res, replaceable));
                            Ok(((input2, state2), ()))
                        }
                        Some((_, true)) => {
                            state2
                                .dtd
                                .generalentities
                                .entry(l)
                                .or_insert((res, replaceable));
                            Ok(((input2, state2), ()))
                        }
                        _ => Ok(((input2, state2), ())),
                    }
                }
                Err(e) => Err(e),
            }
        }
        Err(err) => Err(err),
    }
}