Skip to main content

mpl_lang/
errors.rs

1//! Error types and diagnostics for `MPL` parsing.
2#![allow(unused_assignments)] // We need this for the parse error
3
4use std::fmt::{self, Write as _};
5
6use miette::{Diagnostic, SourceSpan};
7use pest::{
8    error::{Error as PestError, ErrorVariant, InputLocation, LineColLocation},
9    iterators::Pair,
10};
11use strsim::jaro;
12
13use crate::{parser::Rule, query::ParamDeclaration};
14
15/// `MPL` parsing error
16#[derive(thiserror::Error, Debug, Diagnostic)]
17pub enum ParseError {
18    /// Syntax error with source location.
19    #[error("MPL syntax error: {message}")]
20    #[diagnostic(code(mpl_lang::syntax_error))]
21    SyntaxError {
22        /// The source location of the error with detailed message
23        #[label("{label}")]
24        span: SourceSpan,
25        /// Short label for the inline source annotation
26        label: String,
27        /// The detailed error message
28        message: String,
29        /// Optional suggestion for fixing the error
30        #[help]
31        suggestion: Option<Suggestion>,
32    },
33
34    #[error("This feature is not supported at the moment: {rule:?}")]
35    /// Rule for a unsupported feature
36    #[diagnostic(
37        code(mpl_lang::not_supported),
38        help("This feature may be added in a future version")
39    )]
40    NotSupported {
41        /// The source location of the unsupported feature
42        #[label("unsupported: {rule:?}")]
43        span: SourceSpan,
44        /// The rule that is not supported
45        rule: Rule,
46    },
47
48    /// Unexpected rule
49    #[error("Unexpected rule: {rule:?} expected one of {expected:?}")]
50    #[diagnostic(code(mpl_lang::unexpected_rule))]
51    Unexpected {
52        /// The source location of the unexpected rule
53        #[label("unexpected {rule:?}")]
54        span: SourceSpan,
55        /// The rule that was unexpected
56        rule: Rule,
57        /// Expected rules
58        expected: Vec<Rule>,
59    },
60
61    /// Unexpected Token
62    #[error("Found unexpected tokens: {rules:?}")]
63    #[diagnostic(code(mpl_lang::unexpected_tokens))]
64    UnexpectedTokens {
65        /// The source location of the unexpected tokens
66        #[label("unexpected tokens")]
67        span: SourceSpan,
68        /// The unexpected rules
69        rules: Vec<Rule>,
70    },
71
72    /// Unexpected EOF
73    #[error("Unexpected end of input")]
74    #[diagnostic(
75        code(mpl_lang::unexpected_eof),
76        help("The query appears to be incomplete")
77    )]
78    EOF {
79        /// The source location where more input was expected
80        #[label("expected more input here")]
81        span: SourceSpan,
82    },
83
84    /// Invalid Floating point number
85    #[error("Invalid float: {0}")]
86    #[diagnostic(code(mpl_lang::invalid_float))]
87    InvalidFloat(#[from] std::num::ParseFloatError),
88
89    /// Invalid Integer
90    #[error("Invalid integer: {0}")]
91    #[diagnostic(code(mpl_lang::invalid_integer))]
92    InvalidInteger(#[from] std::num::ParseIntError),
93
94    /// Invalid bool
95    #[error("Invalid bool: {0}")]
96    #[diagnostic(code(mpl_lang::invalid_bool))]
97    InvalidBool(#[from] std::str::ParseBoolError),
98
99    /// Invalid date
100    #[error("Invalid date: {0}")]
101    #[diagnostic(code(mpl_lang::invalid_date))]
102    InvalidDate(#[from] chrono::ParseError),
103
104    /// Invalid Regex
105    #[error("Invalid Regex: {0}")]
106    #[diagnostic(code(mpl_lang::invalid_regex))]
107    InvalidRegex(#[from] regex::Error),
108
109    /// Unsupported align function
110    #[error("Unsupported align function: {name}")]
111    #[diagnostic(
112        code(mpl_lang::unsupported_align_function),
113        help("Check the documentation for available align functions")
114    )]
115    UnsupportedAlignFunction {
116        /// The source location of the unsupported function
117        #[label("unknown function")]
118        span: SourceSpan,
119        /// The name of the unsupported function
120        name: String,
121    },
122
123    /// Unsupported group function
124    #[error("Unsupported group function: {name}")]
125    #[diagnostic(
126        code(mpl_lang::unsupported_group_function),
127        help("Check the documentation for available group functions")
128    )]
129    UnsupportedGroupFunction {
130        /// The source location of the unsupported function
131        #[label("unknown function")]
132        span: SourceSpan,
133        /// The name of the unsupported function
134        name: String,
135    },
136
137    /// Unsupported compute function
138    #[error("Unsupported compute function: {name}")]
139    #[diagnostic(
140        code(mpl_lang::unsupported_compute_function),
141        help("Check the documentation for available compute functions")
142    )]
143    UnsupportedComputeFunction {
144        /// The source location of the unsupported function
145        #[label("unknown function")]
146        span: SourceSpan,
147        /// The name of the unsupported function
148        name: String,
149    },
150
151    /// Unsupported bucketing function
152    #[error("Unsupported bucket function: {name}")]
153    #[diagnostic(
154        code(mpl_lang::unsupported_bucket_function),
155        help(
156            "Available functions: histogram, interpolate_delta_histogram, interpolate_cumulative_histogram"
157        )
158    )]
159    UnsupportedBucketFunction {
160        /// The source location of the unsupported function
161        #[label("unknown function")]
162        span: SourceSpan,
163        /// The name of the unsupported function
164        name: String,
165    },
166
167    /// Unsupported map evaluation
168    #[error("Unsupported map evaluation: {name}")]
169    #[diagnostic(
170        code(mpl_lang::unsupported_map_evaluation),
171        help("Check the documentation for available map operations")
172    )]
173    UnsupportedMapEvaluation {
174        /// The source location of the unsupported operation
175        #[label("unknown operation")]
176        span: SourceSpan,
177        /// The name of the unsupported operation
178        name: String,
179    },
180
181    /// Unsupported map function
182    #[error("Unsupported map function: {name}")]
183    #[diagnostic(
184        code(mpl_lang::unsupported_map_function),
185        help("Check the documentation for available map functions")
186    )]
187    UnsupportedMapFunction {
188        /// The source location of the unsupported function
189        #[label("unknown function")]
190        span: SourceSpan,
191        /// The name of the unsupported function
192        name: String,
193    },
194
195    /// Unsupported regexp comparison
196    #[error("Unsupported regexp comparison: {op}")]
197    #[diagnostic(
198        code(mpl_lang::unsupported_regexp_comparison),
199        help("Use '==' or '!=' for regex comparisons")
200    )]
201    UnsupportedRegexpComparison {
202        /// The source location of the unsupported operator
203        #[label("invalid operator")]
204        span: SourceSpan,
205        /// The unsupported operator
206        op: String,
207    },
208
209    /// Unsupported comparison against tag value
210    #[error("Unsupported tag comparison: {op}")]
211    #[diagnostic(
212        code(mpl_lang::unsupported_tag_comparison),
213        help("Supported operators: ==, !=, >, >=, <, <=")
214    )]
215    UnsupportedTagComparison {
216        /// The source location of the unsupported operator
217        #[label("invalid operator")]
218        span: SourceSpan,
219        /// The unsupported operator
220        op: String,
221    },
222
223    /// The feature is not implemented yet
224    #[error("Not implemented: {0}")]
225    #[diagnostic(
226        code(mpl_lang::not_implemented),
227        help("This feature is planned but not yet implemented")
228    )]
229    NotImplemented(&'static str),
230
231    /// Strumbra error
232    #[error("String construction error: {0}")]
233    #[diagnostic(code(mpl_lang::strumbra_error))]
234    StrumbraError(#[from] strumbra::Error),
235
236    /// Unreachable error
237    #[error("Unreachable error: {0}")]
238    #[diagnostic(
239        code(mpl_lang::unreachable),
240        help("This error should never be reached")
241    )]
242    Unreachable(&'static str),
243
244    /// Param is defined multiple times
245    #[error("The param ${param} is defined multiple times")]
246    #[diagnostic(
247        code(mpl_lang::param_defined_multiple_times),
248        help("This param has been defined more than once")
249    )]
250    ParamDefinedMultipleTimes {
251        /// The source location of the duplicate definition
252        #[label("duplicate definition")]
253        span: SourceSpan,
254        /// The param
255        param: String,
256    },
257
258    // commented out until this becomes an error, for now it's a warning
259    // /// Param is using the prefix reserved for system params
260    // #[error("The param ${param} is using a prefix reserved for system params")]
261    // #[diagnostic(
262    //     code(mpl_lang::param_reserved_prefix),
263    //     help("The prefix `__` is reserved for system parameters")
264    // )]
265    // ParamUsingSystemPrefix {
266    //     /// The source location of the param
267    //     #[label("invalid prefix")]
268    //     span: SourceSpan,
269    //     /// The param
270    //     param: String,
271    // },
272    /// The system param is not using the prefix
273    #[error("The system param ${param} is missing the system prefix")]
274    #[diagnostic(
275        code(mpl_lan::system_param_missing_prefix),
276        help("The system param is missing the `__` prefix")
277    )]
278    SystemParamMissingPrefix {
279        /// The param
280        param: String,
281    },
282
283    /// Param is not defined
284    #[error("The param ${param} is not defined")]
285    #[diagnostic(code(mpl_lang::undefined_param))]
286    UndefinedParam {
287        /// The source location of the undefine param
288        #[label("undefined param")]
289        span: SourceSpan,
290        /// The param
291        param: String,
292    },
293    /// Invalid tag type
294    #[error("The type {tpe} is not a valid type for tags")]
295    #[diagnostic(code(mpl_lang::invalid_tag_type))]
296    InvalidTagType {
297        /// The source location of the invalid type
298        #[label("invalid type")]
299        span: miette::SourceSpan,
300        /// The invalid type
301        tpe: String,
302    },
303    /// `ifdef()` was used on a parameter that wasn't declared optional
304    #[error("The parameter {} is not declared as optional", param.name)]
305    #[diagnostic(code(mpl_lang::ifdef_not_optional))]
306    IfdefNotOptional {
307        /// The source location of the param declaration
308        #[label("param declaration")]
309        span: miette::SourceSpan,
310        /// The param type
311        param: ParamDeclaration,
312    },
313}
314
315impl From<PestError<Rule>> for ParseError {
316    fn from(err: PestError<Rule>) -> Self {
317        let (start, mut len) = match err.location {
318            InputLocation::Pos(pos) => (pos, 0),
319            InputLocation::Span((start, end)) => (start, end - start),
320        };
321
322        let (label, message, suggestion) = match &err.variant {
323            ErrorVariant::ParsingError {
324                positives,
325                negatives,
326            } => {
327                let mut keywords = Vec::new();
328                let mut operations = Vec::new();
329                let mut other = Vec::new();
330
331                for rule in positives {
332                    let name = friendly_rule(*rule);
333                    if name.contains("keyword") {
334                        keywords.push(name);
335                    } else if name.contains("operation") {
336                        operations.push(name);
337                    } else {
338                        other.push(name);
339                    }
340                }
341
342                let mut label = String::new();
343                if keywords.is_empty() && operations.is_empty() && other.is_empty() {
344                    label.push_str("unexpected token");
345                } else {
346                    label.push_str("expected one of:\n");
347                    if !keywords.is_empty() {
348                        let kws: Vec<_> = keywords
349                            .iter()
350                            .map(|k| k.trim_end_matches(" keyword"))
351                            .collect();
352                        let _ = writeln!(label, "  keywords: {}", join_with_or(&kws));
353                    }
354                    if !operations.is_empty() {
355                        let ops: Vec<_> = operations
356                            .iter()
357                            .map(|o| {
358                                o.trim_start_matches("a ")
359                                    .trim_start_matches("an ")
360                                    .trim_end_matches(" operation")
361                            })
362                            .collect();
363                        let _ = writeln!(label, "  operations: {}", join_with_or(&ops));
364                    }
365                    if !other.is_empty() {
366                        for name in &other {
367                            let _ = writeln!(label, "  - {name}");
368                        }
369                    }
370                }
371
372                let mut msg = "unexpected token or operation".to_string();
373                if !negatives.is_empty() {
374                    if !msg.is_empty() {
375                        msg.push_str("  ");
376                    }
377                    msg.push_str("but found ");
378                    msg.push_str(&friendly_rules(negatives));
379                }
380
381                let line_pos = match &err.line_col {
382                    LineColLocation::Pos((_, col)) | LineColLocation::Span((_, col), _) => {
383                        col.saturating_sub(1)
384                    }
385                };
386                let suggestion = generate_suggestion(err.line(), line_pos, positives);
387
388                // If the span is a single position, try to expand it to cover the full token
389                if len == 0 {
390                    len = token_length(err.line(), line_pos);
391                }
392
393                let label = label.trim_end().to_string();
394                (label, msg, suggestion)
395            }
396            ErrorVariant::CustomError { message } => (message.clone(), message.clone(), None),
397        };
398
399        ParseError::SyntaxError {
400            span: SourceSpan::new(start.into(), len),
401            label,
402            message,
403            suggestion,
404        }
405    }
406}
407
408/// Join a list of items with commas and "or" before the last item
409fn join_with_or(items: &[&str]) -> String {
410    match items.len() {
411        0 => String::new(),
412        1 => items[0].to_string(),
413        2 => format!("{} or {}", items[0], items[1]),
414        _ => {
415            let last = items[items.len() - 1];
416            let rest = &items[..items.len() - 1];
417            format!("{}, or {last}", rest.join(", "))
418        }
419    }
420}
421
422/// Convert a Pest `Pair` span to a miette `SourceSpan`
423pub(crate) fn pair_to_source_span(pair: &Pair<Rule>) -> SourceSpan {
424    let span = pair.as_span();
425    let start = span.start();
426    let len = span.end() - start;
427    SourceSpan::new(start.into(), len)
428}
429
430/// Convert a list of rules to a friendly name
431fn friendly_rules(rules: &[Rule]) -> String {
432    let names: Vec<_> = rules.iter().copied().map(friendly_rule).collect();
433
434    match names.len() {
435        0 => String::new(),
436        1 => names[0].clone(),
437        2 => format!("{} or {}", names[0], names[1]),
438        _ => {
439            let last = &names[names.len() - 1];
440            let rest = &names[..names.len() - 1];
441            format!("{}, or {last}", rest.join(", "))
442        }
443    }
444}
445
446/// Convert a rule to a friendly name
447fn friendly_rule(rule: Rule) -> String {
448    match rule {
449        // Control
450        Rule::EOI => "end of query".to_string(),
451        Rule::pipe_keyword => "`|` (pipe)".to_string(),
452
453        // Time
454        Rule::time_range => "time range (e.g.,  [1h..])".to_string(),
455        Rule::time_relative => "relative time (e.g., 5m, 1h, 7d)".to_string(),
456        Rule::time_timestamp => "timestamp".to_string(),
457        Rule::time_rfc_3339 => "RFC3339 timestamp".to_string(),
458        Rule::time_modifier => "time modifier".to_string(),
459
460        // Keywords
461        Rule::filter_keyword | Rule::kw_filter => "`filter` keyword".to_string(),
462        Rule::kw_where => "`where` keyword".to_string(),
463        Rule::r#as => "`as` keyword".to_string(),
464
465        // Ops
466        Rule::cmp => "a comparison operator (==, !=, <, >, <=, >=)".to_string(),
467        Rule::cmp_re => "a regex operator (==, !=)".to_string(),
468        Rule::regex => "a regex pattern (e.g., /pattern/)".to_string(),
469
470        // Values
471        Rule::value => "value (string, number, or bool)".to_string(),
472        Rule::string => "string value".to_string(),
473        Rule::number => "number".to_string(),
474        Rule::bool => "bool (true or false)".to_string(),
475
476        // Idents
477        Rule::plain_ident => "identifier".to_string(),
478        Rule::escaped_ident => "escaped identifier".to_string(),
479        Rule::source => "source metric".to_string(),
480        Rule::metric_name => "metric name".to_string(),
481        Rule::metric_id => "metric identifier (e.g., dataset:metric)".to_string(),
482        Rule::dataset => "dataset name".to_string(),
483
484        // Aggrs
485        Rule::align => "an align operation".to_string(),
486        Rule::group_by => "a group by operation".to_string(),
487        Rule::bucket_by => "a bucket by operation".to_string(),
488        Rule::map => "a map operation".to_string(),
489        Rule::replace => "a replace operation".to_string(),
490        Rule::join => "a join operation".to_string(),
491
492        // Query types
493        Rule::simple_query => "simple query".to_string(),
494        Rule::compute_query => "compute query".to_string(),
495
496        // Directives
497        Rule::directive => "directive".to_string(),
498
499        // Params
500        Rule::param => "param".to_string(),
501        Rule::param_ident => "param identifier".to_string(),
502        Rule::param_type => {
503            "param type (Duration, Dataset, Regex, string, int, float, bool)".to_string()
504        }
505
506        // Funs
507        Rule::func => "function".to_string(),
508        Rule::compute_fn => "compute function".to_string(),
509        Rule::bucket_by_fn => {
510            "bucket function (histogram, interpolate_delta_histogram)".to_string()
511        }
512        Rule::bucket_by_with_conversion_fn => {
513            "bucket function (interpolate_cumulative_histogram)".to_string()
514        }
515        Rule::bucket_conversion => "conversion method (rate, increase)".to_string(),
516        Rule::bucket_specs => "bucket specifications".to_string(),
517        Rule::bucket_fn_call | Rule::bucket_fn_call_simple => "bucket function call".to_string(),
518        Rule::bucket_fn_call_with_conversion => "bucket function call with conversion".to_string(),
519
520        // Filters
521        Rule::filter_rule => "filter rule".to_string(),
522        Rule::filter_expr => "filter expression".to_string(),
523        Rule::sample_expr => "sample expression".to_string(),
524        Rule::value_filter => "value filter".to_string(),
525        Rule::regex_filter => "regex filter".to_string(),
526        Rule::kw_is => "`is` keyword".to_string(),
527        Rule::is_filter => "type filter (e.g., is string)".to_string(),
528        Rule::tag_type => "tag type (string, int, float, or bool)".to_string(),
529
530        // Tags
531        Rule::tags => "tags (comma-separated field names)".to_string(),
532        Rule::tag => "tag name".to_string(),
533
534        // Fallback for any other rules
535        _ => {
536            let name = format!("{rule:?}");
537            name.to_lowercase().replace('_', " ")
538        }
539    }
540}
541
542/// Suggestion for typos / corrections
543#[derive(Debug, Clone)]
544pub struct Suggestion(String);
545
546impl Suggestion {
547    /// The suggested text
548    #[must_use]
549    pub fn suggestion(&self) -> &str {
550        &self.0
551    }
552}
553
554impl fmt::Display for Suggestion {
555    fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
556        write!(f, "Did you mean \"{}\"?", self.0)
557    }
558}
559
560/// Generate a suggestion for a typo based on the expected rules
561fn generate_suggestion(
562    line: &str,
563    error_pos: usize,
564    expected_rules: &[Rule],
565) -> Option<Suggestion> {
566    let actual_token = extract_token(line, error_pos)?;
567
568    if actual_token.len() < 2 {
569        return None;
570    }
571
572    let possible_keywords = rules_keywords(expected_rules);
573
574    let mut best_match: Option<(&str, f64)> = None;
575
576    for keyword in &possible_keywords {
577        let similarity = jaro(&actual_token.to_lowercase(), &keyword.to_lowercase());
578
579        if similarity > 0.8 {
580            if let Some((_, best_score)) = best_match {
581                if similarity > best_score {
582                    best_match = Some((keyword, similarity));
583                }
584            } else {
585                best_match = Some((keyword, similarity));
586            }
587        }
588    }
589
590    best_match.map(|(keyword, _)| Suggestion(keyword.to_string()))
591}
592
593/// Extract the token at the given position from the line
594fn extract_token(line: &str, pos: usize) -> Option<String> {
595    let chars: Vec<char> = line.chars().collect();
596
597    if pos >= chars.len() {
598        return None;
599    }
600
601    // Skip whitespace forward to find the next token
602    let mut pos = pos;
603    while pos < chars.len() && chars[pos].is_whitespace() {
604        pos += 1;
605    }
606
607    if pos >= chars.len() {
608        return None;
609    }
610
611    // Find the start of the token (go backwards)
612    let mut start = pos;
613    while start > 0 && chars[start - 1].is_alphanumeric() {
614        start -= 1;
615    }
616
617    // Find the end of the token (go forwards)
618    let mut end = pos;
619    while end < chars.len() && chars[end].is_alphanumeric() {
620        end += 1;
621    }
622
623    if start < end {
624        Some(chars[start..end].iter().collect())
625    } else {
626        None
627    }
628}
629
630/// Extract the length of the token at the given position
631fn token_length(line: &str, pos: usize) -> usize {
632    let chars: Vec<char> = line.chars().collect();
633
634    if pos >= chars.len() {
635        return 0;
636    }
637
638    if !chars[pos].is_alphanumeric() {
639        return 1;
640    }
641
642    let mut end = pos;
643    while end < chars.len() && chars[end].is_alphanumeric() {
644        end += 1;
645    }
646
647    end - pos
648}
649
650/// Get a list of common keywords that correspond to a list of rules
651fn rules_keywords(rules: &[Rule]) -> Vec<&'static str> {
652    let mut keywords = Vec::new();
653
654    for rule in rules {
655        match rule {
656            Rule::filter_keyword | Rule::kw_filter | Rule::kw_where => {
657                keywords.push("where");
658                keywords.push("filter");
659            }
660            Rule::r#as => keywords.push("as"),
661            Rule::align => keywords.push("align"),
662            Rule::group_by => keywords.push("group"),
663            Rule::bucket_by => keywords.push("bucket"),
664            Rule::map => keywords.push("map"),
665            Rule::replace => keywords.push("replace"),
666            Rule::join => keywords.push("join"),
667            Rule::kw_is => keywords.push("is"),
668            Rule::tag_type => {
669                keywords.push("string");
670                keywords.push("int");
671                keywords.push("float");
672                keywords.push("bool");
673            }
674            _ => {}
675        }
676    }
677
678    keywords
679}