1#![allow(unused_assignments)] use std::fmt::{self, Write as _};
5
6use miette::{Diagnostic, SourceSpan};
7use pest::{
8 error::{Error as PestError, ErrorVariant, InputLocation, LineColLocation},
9 iterators::Pair,
10};
11use strsim::jaro;
12
13use crate::{parser::Rule, query::ParamDeclaration};
14
15#[derive(thiserror::Error, Debug, Diagnostic)]
17pub enum ParseError {
18 #[error("MPL syntax error: {message}")]
20 #[diagnostic(code(mpl_lang::syntax_error))]
21 SyntaxError {
22 #[label("{label}")]
24 span: SourceSpan,
25 label: String,
27 message: String,
29 #[help]
31 suggestion: Option<Suggestion>,
32 },
33
34 #[error("This feature is not supported at the moment: {rule:?}")]
35 #[diagnostic(
37 code(mpl_lang::not_supported),
38 help("This feature may be added in a future version")
39 )]
40 NotSupported {
41 #[label("unsupported: {rule:?}")]
43 span: SourceSpan,
44 rule: Rule,
46 },
47
48 #[error("Unexpected rule: {rule:?} expected one of {expected:?}")]
50 #[diagnostic(code(mpl_lang::unexpected_rule))]
51 Unexpected {
52 #[label("unexpected {rule:?}")]
54 span: SourceSpan,
55 rule: Rule,
57 expected: Vec<Rule>,
59 },
60
61 #[error("Found unexpected tokens: {rules:?}")]
63 #[diagnostic(code(mpl_lang::unexpected_tokens))]
64 UnexpectedTokens {
65 #[label("unexpected tokens")]
67 span: SourceSpan,
68 rules: Vec<Rule>,
70 },
71
72 #[error("Unexpected end of input")]
74 #[diagnostic(
75 code(mpl_lang::unexpected_eof),
76 help("The query appears to be incomplete")
77 )]
78 EOF {
79 #[label("expected more input here")]
81 span: SourceSpan,
82 },
83
84 #[error("Invalid float: {0}")]
86 #[diagnostic(code(mpl_lang::invalid_float))]
87 InvalidFloat(#[from] std::num::ParseFloatError),
88
89 #[error("Invalid integer: {0}")]
91 #[diagnostic(code(mpl_lang::invalid_integer))]
92 InvalidInteger(#[from] std::num::ParseIntError),
93
94 #[error("Invalid bool: {0}")]
96 #[diagnostic(code(mpl_lang::invalid_bool))]
97 InvalidBool(#[from] std::str::ParseBoolError),
98
99 #[error("Invalid date: {0}")]
101 #[diagnostic(code(mpl_lang::invalid_date))]
102 InvalidDate(#[from] chrono::ParseError),
103
104 #[error("Invalid Regex: {0}")]
106 #[diagnostic(code(mpl_lang::invalid_regex))]
107 InvalidRegex(#[from] regex::Error),
108
109 #[error("Unsupported align function: {name}")]
111 #[diagnostic(
112 code(mpl_lang::unsupported_align_function),
113 help("Check the documentation for available align functions")
114 )]
115 UnsupportedAlignFunction {
116 #[label("unknown function")]
118 span: SourceSpan,
119 name: String,
121 },
122
123 #[error("Unsupported group function: {name}")]
125 #[diagnostic(
126 code(mpl_lang::unsupported_group_function),
127 help("Check the documentation for available group functions")
128 )]
129 UnsupportedGroupFunction {
130 #[label("unknown function")]
132 span: SourceSpan,
133 name: String,
135 },
136
137 #[error("Unsupported compute function: {name}")]
139 #[diagnostic(
140 code(mpl_lang::unsupported_compute_function),
141 help("Check the documentation for available compute functions")
142 )]
143 UnsupportedComputeFunction {
144 #[label("unknown function")]
146 span: SourceSpan,
147 name: String,
149 },
150
151 #[error("Unsupported bucket function: {name}")]
153 #[diagnostic(
154 code(mpl_lang::unsupported_bucket_function),
155 help(
156 "Available functions: histogram, interpolate_delta_histogram, interpolate_cumulative_histogram"
157 )
158 )]
159 UnsupportedBucketFunction {
160 #[label("unknown function")]
162 span: SourceSpan,
163 name: String,
165 },
166
167 #[error("Unsupported map evaluation: {name}")]
169 #[diagnostic(
170 code(mpl_lang::unsupported_map_evaluation),
171 help("Check the documentation for available map operations")
172 )]
173 UnsupportedMapEvaluation {
174 #[label("unknown operation")]
176 span: SourceSpan,
177 name: String,
179 },
180
181 #[error("Unsupported map function: {name}")]
183 #[diagnostic(
184 code(mpl_lang::unsupported_map_function),
185 help("Check the documentation for available map functions")
186 )]
187 UnsupportedMapFunction {
188 #[label("unknown function")]
190 span: SourceSpan,
191 name: String,
193 },
194
195 #[error("Unsupported regexp comparison: {op}")]
197 #[diagnostic(
198 code(mpl_lang::unsupported_regexp_comparison),
199 help("Use '==' or '!=' for regex comparisons")
200 )]
201 UnsupportedRegexpComparison {
202 #[label("invalid operator")]
204 span: SourceSpan,
205 op: String,
207 },
208
209 #[error("Unsupported tag comparison: {op}")]
211 #[diagnostic(
212 code(mpl_lang::unsupported_tag_comparison),
213 help("Supported operators: ==, !=, >, >=, <, <=")
214 )]
215 UnsupportedTagComparison {
216 #[label("invalid operator")]
218 span: SourceSpan,
219 op: String,
221 },
222
223 #[error("Not implemented: {0}")]
225 #[diagnostic(
226 code(mpl_lang::not_implemented),
227 help("This feature is planned but not yet implemented")
228 )]
229 NotImplemented(&'static str),
230
231 #[error("String construction error: {0}")]
233 #[diagnostic(code(mpl_lang::strumbra_error))]
234 StrumbraError(#[from] strumbra::Error),
235
236 #[error("Unreachable error: {0}")]
238 #[diagnostic(
239 code(mpl_lang::unreachable),
240 help("This error should never be reached")
241 )]
242 Unreachable(&'static str),
243
244 #[error("The param ${param} is defined multiple times")]
246 #[diagnostic(
247 code(mpl_lang::param_defined_multiple_times),
248 help("This param has been defined more than once")
249 )]
250 ParamDefinedMultipleTimes {
251 #[label("duplicate definition")]
253 span: SourceSpan,
254 param: String,
256 },
257
258 #[error("The system param ${param} is missing the system prefix")]
274 #[diagnostic(
275 code(mpl_lan::system_param_missing_prefix),
276 help("The system param is missing the `__` prefix")
277 )]
278 SystemParamMissingPrefix {
279 param: String,
281 },
282
283 #[error("The param ${param} is not defined")]
285 #[diagnostic(code(mpl_lang::undefined_param))]
286 UndefinedParam {
287 #[label("undefined param")]
289 span: SourceSpan,
290 param: String,
292 },
293 #[error("The type {tpe} is not a valid type for tags")]
295 #[diagnostic(code(mpl_lang::invalid_tag_type))]
296 InvalidTagType {
297 #[label("invalid type")]
299 span: miette::SourceSpan,
300 tpe: String,
302 },
303 #[error("The parameter {} is not declared as optional", param.name)]
305 #[diagnostic(code(mpl_lang::ifdef_not_optional))]
306 IfdefNotOptional {
307 #[label("param declaration")]
309 span: miette::SourceSpan,
310 param: ParamDeclaration,
312 },
313}
314
315impl From<PestError<Rule>> for ParseError {
316 fn from(err: PestError<Rule>) -> Self {
317 let (start, mut len) = match err.location {
318 InputLocation::Pos(pos) => (pos, 0),
319 InputLocation::Span((start, end)) => (start, end - start),
320 };
321
322 let (label, message, suggestion) = match &err.variant {
323 ErrorVariant::ParsingError {
324 positives,
325 negatives,
326 } => {
327 let mut keywords = Vec::new();
328 let mut operations = Vec::new();
329 let mut other = Vec::new();
330
331 for rule in positives {
332 let name = friendly_rule(*rule);
333 if name.contains("keyword") {
334 keywords.push(name);
335 } else if name.contains("operation") {
336 operations.push(name);
337 } else {
338 other.push(name);
339 }
340 }
341
342 let mut label = String::new();
343 if keywords.is_empty() && operations.is_empty() && other.is_empty() {
344 label.push_str("unexpected token");
345 } else {
346 label.push_str("expected one of:\n");
347 if !keywords.is_empty() {
348 let kws: Vec<_> = keywords
349 .iter()
350 .map(|k| k.trim_end_matches(" keyword"))
351 .collect();
352 let _ = writeln!(label, " keywords: {}", join_with_or(&kws));
353 }
354 if !operations.is_empty() {
355 let ops: Vec<_> = operations
356 .iter()
357 .map(|o| {
358 o.trim_start_matches("a ")
359 .trim_start_matches("an ")
360 .trim_end_matches(" operation")
361 })
362 .collect();
363 let _ = writeln!(label, " operations: {}", join_with_or(&ops));
364 }
365 if !other.is_empty() {
366 for name in &other {
367 let _ = writeln!(label, " - {name}");
368 }
369 }
370 }
371
372 let mut msg = "unexpected token or operation".to_string();
373 if !negatives.is_empty() {
374 if !msg.is_empty() {
375 msg.push_str(" ");
376 }
377 msg.push_str("but found ");
378 msg.push_str(&friendly_rules(negatives));
379 }
380
381 let line_pos = match &err.line_col {
382 LineColLocation::Pos((_, col)) | LineColLocation::Span((_, col), _) => {
383 col.saturating_sub(1)
384 }
385 };
386 let suggestion = generate_suggestion(err.line(), line_pos, positives);
387
388 if len == 0 {
390 len = token_length(err.line(), line_pos);
391 }
392
393 let label = label.trim_end().to_string();
394 (label, msg, suggestion)
395 }
396 ErrorVariant::CustomError { message } => (message.clone(), message.clone(), None),
397 };
398
399 ParseError::SyntaxError {
400 span: SourceSpan::new(start.into(), len),
401 label,
402 message,
403 suggestion,
404 }
405 }
406}
407
408fn join_with_or(items: &[&str]) -> String {
410 match items.len() {
411 0 => String::new(),
412 1 => items[0].to_string(),
413 2 => format!("{} or {}", items[0], items[1]),
414 _ => {
415 let last = items[items.len() - 1];
416 let rest = &items[..items.len() - 1];
417 format!("{}, or {last}", rest.join(", "))
418 }
419 }
420}
421
422pub(crate) fn pair_to_source_span(pair: &Pair<Rule>) -> SourceSpan {
424 let span = pair.as_span();
425 let start = span.start();
426 let len = span.end() - start;
427 SourceSpan::new(start.into(), len)
428}
429
430fn friendly_rules(rules: &[Rule]) -> String {
432 let names: Vec<_> = rules.iter().copied().map(friendly_rule).collect();
433
434 match names.len() {
435 0 => String::new(),
436 1 => names[0].clone(),
437 2 => format!("{} or {}", names[0], names[1]),
438 _ => {
439 let last = &names[names.len() - 1];
440 let rest = &names[..names.len() - 1];
441 format!("{}, or {last}", rest.join(", "))
442 }
443 }
444}
445
446fn friendly_rule(rule: Rule) -> String {
448 match rule {
449 Rule::EOI => "end of query".to_string(),
451 Rule::pipe_keyword => "`|` (pipe)".to_string(),
452
453 Rule::time_range => "time range (e.g., [1h..])".to_string(),
455 Rule::time_relative => "relative time (e.g., 5m, 1h, 7d)".to_string(),
456 Rule::time_timestamp => "timestamp".to_string(),
457 Rule::time_rfc_3339 => "RFC3339 timestamp".to_string(),
458 Rule::time_modifier => "time modifier".to_string(),
459
460 Rule::filter_keyword | Rule::kw_filter => "`filter` keyword".to_string(),
462 Rule::kw_where => "`where` keyword".to_string(),
463 Rule::r#as => "`as` keyword".to_string(),
464
465 Rule::cmp => "a comparison operator (==, !=, <, >, <=, >=)".to_string(),
467 Rule::cmp_re => "a regex operator (==, !=)".to_string(),
468 Rule::regex => "a regex pattern (e.g., /pattern/)".to_string(),
469
470 Rule::value => "value (string, number, or bool)".to_string(),
472 Rule::string => "string value".to_string(),
473 Rule::number => "number".to_string(),
474 Rule::bool => "bool (true or false)".to_string(),
475
476 Rule::plain_ident => "identifier".to_string(),
478 Rule::escaped_ident => "escaped identifier".to_string(),
479 Rule::source => "source metric".to_string(),
480 Rule::metric_name => "metric name".to_string(),
481 Rule::metric_id => "metric identifier (e.g., dataset:metric)".to_string(),
482 Rule::dataset => "dataset name".to_string(),
483
484 Rule::align => "an align operation".to_string(),
486 Rule::group_by => "a group by operation".to_string(),
487 Rule::bucket_by => "a bucket by operation".to_string(),
488 Rule::map => "a map operation".to_string(),
489 Rule::replace => "a replace operation".to_string(),
490 Rule::join => "a join operation".to_string(),
491
492 Rule::simple_query => "simple query".to_string(),
494 Rule::compute_query => "compute query".to_string(),
495
496 Rule::directive => "directive".to_string(),
498
499 Rule::param => "param".to_string(),
501 Rule::param_ident => "param identifier".to_string(),
502 Rule::param_type => {
503 "param type (Duration, Dataset, Regex, string, int, float, bool)".to_string()
504 }
505
506 Rule::func => "function".to_string(),
508 Rule::compute_fn => "compute function".to_string(),
509 Rule::bucket_by_fn => {
510 "bucket function (histogram, interpolate_delta_histogram)".to_string()
511 }
512 Rule::bucket_by_with_conversion_fn => {
513 "bucket function (interpolate_cumulative_histogram)".to_string()
514 }
515 Rule::bucket_conversion => "conversion method (rate, increase)".to_string(),
516 Rule::bucket_specs => "bucket specifications".to_string(),
517 Rule::bucket_fn_call | Rule::bucket_fn_call_simple => "bucket function call".to_string(),
518 Rule::bucket_fn_call_with_conversion => "bucket function call with conversion".to_string(),
519
520 Rule::filter_rule => "filter rule".to_string(),
522 Rule::filter_expr => "filter expression".to_string(),
523 Rule::sample_expr => "sample expression".to_string(),
524 Rule::value_filter => "value filter".to_string(),
525 Rule::regex_filter => "regex filter".to_string(),
526 Rule::kw_is => "`is` keyword".to_string(),
527 Rule::is_filter => "type filter (e.g., is string)".to_string(),
528 Rule::tag_type => "tag type (string, int, float, or bool)".to_string(),
529
530 Rule::tags => "tags (comma-separated field names)".to_string(),
532 Rule::tag => "tag name".to_string(),
533
534 _ => {
536 let name = format!("{rule:?}");
537 name.to_lowercase().replace('_', " ")
538 }
539 }
540}
541
542#[derive(Debug, Clone)]
544pub struct Suggestion(String);
545
546impl Suggestion {
547 #[must_use]
549 pub fn suggestion(&self) -> &str {
550 &self.0
551 }
552}
553
554impl fmt::Display for Suggestion {
555 fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
556 write!(f, "Did you mean \"{}\"?", self.0)
557 }
558}
559
560fn generate_suggestion(
562 line: &str,
563 error_pos: usize,
564 expected_rules: &[Rule],
565) -> Option<Suggestion> {
566 let actual_token = extract_token(line, error_pos)?;
567
568 if actual_token.len() < 2 {
569 return None;
570 }
571
572 let possible_keywords = rules_keywords(expected_rules);
573
574 let mut best_match: Option<(&str, f64)> = None;
575
576 for keyword in &possible_keywords {
577 let similarity = jaro(&actual_token.to_lowercase(), &keyword.to_lowercase());
578
579 if similarity > 0.8 {
580 if let Some((_, best_score)) = best_match {
581 if similarity > best_score {
582 best_match = Some((keyword, similarity));
583 }
584 } else {
585 best_match = Some((keyword, similarity));
586 }
587 }
588 }
589
590 best_match.map(|(keyword, _)| Suggestion(keyword.to_string()))
591}
592
593fn extract_token(line: &str, pos: usize) -> Option<String> {
595 let chars: Vec<char> = line.chars().collect();
596
597 if pos >= chars.len() {
598 return None;
599 }
600
601 let mut pos = pos;
603 while pos < chars.len() && chars[pos].is_whitespace() {
604 pos += 1;
605 }
606
607 if pos >= chars.len() {
608 return None;
609 }
610
611 let mut start = pos;
613 while start > 0 && chars[start - 1].is_alphanumeric() {
614 start -= 1;
615 }
616
617 let mut end = pos;
619 while end < chars.len() && chars[end].is_alphanumeric() {
620 end += 1;
621 }
622
623 if start < end {
624 Some(chars[start..end].iter().collect())
625 } else {
626 None
627 }
628}
629
630fn token_length(line: &str, pos: usize) -> usize {
632 let chars: Vec<char> = line.chars().collect();
633
634 if pos >= chars.len() {
635 return 0;
636 }
637
638 if !chars[pos].is_alphanumeric() {
639 return 1;
640 }
641
642 let mut end = pos;
643 while end < chars.len() && chars[end].is_alphanumeric() {
644 end += 1;
645 }
646
647 end - pos
648}
649
650fn rules_keywords(rules: &[Rule]) -> Vec<&'static str> {
652 let mut keywords = Vec::new();
653
654 for rule in rules {
655 match rule {
656 Rule::filter_keyword | Rule::kw_filter | Rule::kw_where => {
657 keywords.push("where");
658 keywords.push("filter");
659 }
660 Rule::r#as => keywords.push("as"),
661 Rule::align => keywords.push("align"),
662 Rule::group_by => keywords.push("group"),
663 Rule::bucket_by => keywords.push("bucket"),
664 Rule::map => keywords.push("map"),
665 Rule::replace => keywords.push("replace"),
666 Rule::join => keywords.push("join"),
667 Rule::kw_is => keywords.push("is"),
668 Rule::tag_type => {
669 keywords.push("string");
670 keywords.push("int");
671 keywords.push("float");
672 keywords.push("bool");
673 }
674 _ => {}
675 }
676 }
677
678 keywords
679}