styx-parse 3.0.2

Event-based parser for the Styx configuration language
Documentation
//! Event types for the Styx event-based parser.

use std::borrow::Cow;

use styx_tokenizer::Span;

/// An event emitted by the parser, with its source location.
#[derive(Debug, Clone, PartialEq, Eq)]
pub struct Event<'src> {
    /// The source location associated with this event.
    pub span: Span,
    /// The kind of event.
    pub kind: EventKind<'src>,
}

/// The kind of event emitted by the parser.
#[derive(Debug, Clone, PartialEq, Eq)]
pub enum EventKind<'src> {
    // Document boundaries
    /// Start of document.
    DocumentStart,
    /// End of document.
    DocumentEnd,

    // Objects
    /// Start of an object `{ ... }`.
    ObjectStart,
    /// End of an object.
    ObjectEnd,

    // Sequences
    /// Start of a sequence `( ... )`.
    SequenceStart,
    /// End of a sequence.
    SequenceEnd,

    // Entry structure (within objects)
    /// Start of an entry (key-value pair).
    EntryStart,
    /// A key in an entry.
    ///
    /// Keys can be scalars or unit, optionally tagged.
    /// Objects, sequences, and heredocs are not allowed as keys.
    Key {
        /// Tag name if this key is tagged (without @).
        tag: Option<&'src str>,
        /// Scalar payload after escape processing. None means unit.
        payload: Option<Cow<'src, str>>,
        /// Kind of scalar used for the key. Only meaningful if payload is Some.
        kind: ScalarKind,
    },
    /// End of an entry.
    EntryEnd,

    // Values
    /// A scalar value.
    Scalar {
        /// Value after escape processing.
        value: Cow<'src, str>,
        /// Kind of scalar.
        kind: ScalarKind,
    },
    /// Unit value `@`.
    Unit,

    // Tags
    /// Start of a tag `@name`.
    TagStart {
        /// Tag name (without @).
        name: &'src str,
    },
    /// End of a tag.
    TagEnd,

    // Comments
    /// Line comment `// ...`.
    Comment {
        /// Comment text (including //).
        text: &'src str,
    },
    /// Doc comment `/// ...`.
    DocComment {
        /// Doc comment lines (without `/// ` prefix).
        lines: Vec<&'src str>,
    },

    // Errors
    /// Parse error.
    Error {
        /// Kind of error.
        kind: ParseErrorKind,
    },
}

/// Kind of scalar.
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
#[cfg_attr(feature = "facet", derive(facet::Facet))]
#[repr(u8)]
pub enum ScalarKind {
    /// Bare (unquoted) scalar.
    Bare,
    /// Quoted string `"..."`.
    Quoted,
    /// Raw string `r#"..."#`.
    Raw,
    /// Heredoc `<<DELIM...DELIM`.
    Heredoc,
}

/// Parse error kinds.
#[derive(Debug, Clone, PartialEq, Eq)]
pub enum ParseErrorKind {
    /// Unexpected token.
    UnexpectedToken,
    /// Unclosed object (missing `}`).
    UnclosedObject,
    /// Unclosed sequence (missing `)`).
    UnclosedSequence,
    /// Invalid escape sequence in quoted string.
    InvalidEscape(String),
    /// Expected a key.
    ExpectedKey,
    /// Expected a value.
    ExpectedValue,
    /// Unexpected end of input.
    UnexpectedEof,
    /// Duplicate key in object. Contains the span of the first occurrence.
    // parser[impl entry.key-equality]
    DuplicateKey { original: Span },
    /// Invalid tag name (must match pattern).
    InvalidTagName,
    /// Invalid key (e.g., heredoc used as key).
    InvalidKey,
    /// Dangling doc comment (not followed by entry).
    DanglingDocComment,
    /// Too many atoms in entry (expected at most 2: key and value).
    // parser[impl entry.toomany]
    TooManyAtoms,
    /// Attempted to reopen a path that was closed when a sibling appeared.
    // parser[impl entry.path.reopen]
    ReopenedPath {
        /// The closed path that was attempted to be reopened.
        closed_path: Vec<String>,
    },
    /// Attempted to nest into a path that has a terminal value (scalar/sequence/tag/unit).
    NestIntoTerminal {
        /// The path that has a terminal value.
        terminal_path: Vec<String>,
    },
    /// Comma in sequence (sequences are whitespace-separated, not comma-separated).
    CommaInSequence,
    /// Missing whitespace between bare scalar and `{` or `(`.
    // parser[impl entry.whitespace]
    MissingWhitespaceBeforeBlock,
    /// Trailing content after explicit root object.
    TrailingContent,
}

impl std::fmt::Display for ParseErrorKind {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        match self {
            ParseErrorKind::UnexpectedToken => write!(f, "unexpected token"),
            ParseErrorKind::UnclosedObject => write!(f, "unclosed object (missing `}}`)"),
            ParseErrorKind::UnclosedSequence => write!(f, "unclosed sequence (missing `)`)"),
            ParseErrorKind::InvalidEscape(seq) => write!(f, "invalid escape sequence: {}", seq),
            ParseErrorKind::ExpectedKey => write!(f, "expected a key"),
            ParseErrorKind::ExpectedValue => write!(f, "expected a value"),
            ParseErrorKind::UnexpectedEof => write!(f, "unexpected end of input"),
            ParseErrorKind::DuplicateKey { .. } => write!(f, "duplicate key"),
            ParseErrorKind::InvalidTagName => write!(f, "invalid tag name"),
            ParseErrorKind::InvalidKey => write!(f, "invalid key"),
            ParseErrorKind::DanglingDocComment => {
                write!(f, "doc comment not followed by an entry")
            }
            ParseErrorKind::TooManyAtoms => {
                write!(f, "unexpected atom after value (entry has too many atoms)")
            }
            ParseErrorKind::ReopenedPath { closed_path } => {
                write!(
                    f,
                    "cannot reopen path `{}` after sibling appeared",
                    closed_path.join(".")
                )
            }
            ParseErrorKind::NestIntoTerminal { terminal_path } => {
                write!(
                    f,
                    "cannot nest into `{}` which has a terminal value",
                    terminal_path.join(".")
                )
            }
            ParseErrorKind::CommaInSequence => {
                write!(
                    f,
                    "unexpected `,` in sequence (sequences are whitespace-separated, not comma-separated)"
                )
            }
            ParseErrorKind::MissingWhitespaceBeforeBlock => {
                write!(
                    f,
                    "missing whitespace before `{{` or `(` (required after bare scalar to distinguish from tag syntax like `@tag{{}}`)"
                )
            }
            ParseErrorKind::TrailingContent => {
                write!(f, "trailing content after explicit root object")
            }
        }
    }
}