Skip to main content

mech_syntax/
mechdown.rs

1#[macro_use]
2use crate::*;
3
4#[cfg(not(feature = "no-std"))] use core::fmt;
5#[cfg(feature = "no-std")] use alloc::fmt;
6#[cfg(feature = "no-std")] use alloc::string::String;
7#[cfg(feature = "no-std")] use alloc::vec::Vec;
8use nom::{
9  IResult,
10  branch::alt,
11  sequence::{tuple as nom_tuple, pair},
12  combinator::{opt, eof, peek},
13  multi::{many1, many_till, many0, separated_list1,separated_list0},
14  bytes::complete::{take_until, take_while},
15  Err,
16  Err::Failure
17};
18
19use std::collections::HashMap;
20use colored::*;
21
22use crate::*;
23
24// Mechdown
25// ============================================================================
26
27// title := +text, new-line, +equal, *(space|tab), *whitespace ;
28pub fn title(input: ParseString) -> ParseResult<Title> {
29  let (input, mut text) = many1(text)(input)?;
30  let (input, _) = new_line(input)?;
31  let (input, _) = many1(equal)(input)?;
32  let (input, _) = whitespace0(input)?;
33  let (input, byline) = opt(byline)(input)?;
34  let mut title = Token::merge_tokens(&mut text).unwrap();
35  title.kind = TokenKind::Title;
36  Ok((input, Title{text: title, byline}))
37}
38
39pub fn byline(input: ParseString) -> ParseResult<Paragraph> {
40  let (input, byline) = paragraph_newline(input)?;
41  let (input, _) = many1(equal)(input)?;
42  Ok((input, byline))
43}
44
45pub struct MarkdownTableHeader {
46  pub header: Vec<(Token, Token)>,
47}
48
49pub fn no_alignment(input: ParseString) -> ParseResult<ColumnAlignment> {
50  let (input, _) = many1(dash)(input)?;
51  Ok((input, ColumnAlignment::Left))
52}
53
54pub fn left_alignment(input: ParseString) -> ParseResult<ColumnAlignment> {
55  let (input, _) = colon(input)?;
56  let (input, _) = many1(dash)(input)?;
57  Ok((input, ColumnAlignment::Left))
58}
59
60pub fn right_alignment(input: ParseString) -> ParseResult<ColumnAlignment> {
61  let (input, _) = many1(dash)(input)?;
62  let (input, _) = colon(input)?;
63  Ok((input, ColumnAlignment::Right))
64}
65
66pub fn center_alignment(input: ParseString) -> ParseResult<ColumnAlignment> {
67  let (input, _) = colon(input)?;
68  let (input, _) = many1(dash)(input)?;
69  let (input, _) = colon(input)?;
70  Ok((input, ColumnAlignment::Center))
71}
72
73pub fn alignment_separator(input: ParseString) -> ParseResult<ColumnAlignment> {
74  let (input, _) = many0(space_tab)(input)?;
75  let (input, separator) = alt((center_alignment, left_alignment, right_alignment, no_alignment))(input)?;
76  let (input, _) = many0(space_tab)(input)?;
77  Ok((input, separator))
78}
79
80pub fn mechdown_table(input: ParseString) -> ParseResult<MarkdownTable> {
81  let (input, _) = whitespace0(input)?;
82  let (input, table) = alt((mechdown_table_with_header, mechdown_table_no_header))(input)?;
83  Ok((input, table))
84}
85
86pub fn mechdown_table_with_header(input: ParseString) -> ParseResult<MarkdownTable> {
87  let (input, (header,alignment)) = mechdown_table_header(input)?;
88  let (input, rows) = many1(mechdown_table_row)(input)?;
89  Ok((input, MarkdownTable{header, rows, alignment}))
90}
91
92pub fn mechdown_table_no_header(input: ParseString) -> ParseResult<MarkdownTable> {
93  let (input, rows) = many1(mechdown_table_row)(input)?;
94  let header = vec![];
95  let alignment = vec![];
96  Ok((input, MarkdownTable{header, rows, alignment}))
97}
98
99pub fn mechdown_table_header(input: ParseString) -> ParseResult<(Vec<Paragraph>,Vec<ColumnAlignment>)> {
100  let (input, _) = whitespace0(input)?;
101  let (input, header) = many1(tuple((bar, tuple((many0(space_tab), inline_paragraph)))))(input)?;
102  let (input, _) = bar(input)?;
103  let (input, _) = whitespace0(input)?;
104  let (input, alignment) = many1(tuple((bar, tuple((many0(space_tab), alignment_separator)))))(input)?;
105  let (input, _) = bar(input)?;
106  let (input, _) = whitespace0(input)?;
107  let column_names: Vec<Paragraph> = header.into_iter().map(|(_,(_,tkn))| tkn).collect();
108  let column_alignments = alignment.into_iter().map(|(_,(_,tkn))| tkn).collect();
109  Ok((input, (column_names,column_alignments)))
110}
111
112pub fn empty_paragraph(input: ParseString) -> ParseResult<Paragraph> {
113  Ok((input, Paragraph{elements: vec![], error_range: None}))
114}
115
116// mechdown_table_row := +(bar, paragraph), bar, *whitespace ;
117pub fn mechdown_table_row(input: ParseString) -> ParseResult<Vec<Paragraph>> {
118  let (input, _) = whitespace0(input)?;
119  let (input, _) = bar(input)?;
120  let (input, row) = many1(tuple((alt((tuple((many0(space_tab), inline_paragraph)),tuple((many1(space_tab), empty_paragraph)))),bar)))(input)?;
121  let (input, _) = whitespace0(input)?;
122  let row = row.into_iter().map(|((_,tkn),_)| tkn).collect();
123  Ok((input, row))
124}
125
126// subtitle := +(digit | alpha), period, *space-tab, paragraph-newline, *space-tab, whitespace* ;
127pub fn ul_subtitle(input: ParseString) -> ParseResult<Subtitle> {
128  let (input, _) = many1((alt((digit_token, alpha_token))))(input)?;
129  let (input, _) = period(input)?;
130  let (input, _) = many0(space_tab)(input)?;
131  let (input, text) = paragraph_newline(input)?;
132  let (input, _) = many1(dash)(input)?;
133  let (input, _) = many0(space_tab)(input)?;
134  let (input, _) = new_line(input)?;
135  let (input, _) = many0(space_tab)(input)?;
136  let (input, _) = whitespace0(input)?;
137  Ok((input, Subtitle{text, level: 2}))
138}
139
140// subtitle := *(space-tab), "(", +(alpha | digit | period), ")", *(space-tab), paragraph-newline, *(space-tab), whitespace* ;
141pub fn subtitle(input: ParseString) -> ParseResult<Subtitle> {
142  let (input, _) = peek(is_not(alt((error_sigil, info_sigil))))(input)?;
143  let (input, _) = many0(space_tab)(input)?;
144  let (input, _) = left_parenthesis(input)?;
145  let (input, num) = separated_list1(period,alt((many1(alpha),many1(digit))))(input)?;
146  let (input, _) = right_parenthesis(input)?;
147  let (input, _) = many0(space_tab)(input)?;
148  let (input, text) = paragraph_newline(input)?;
149  let (input, _) = many0(space_tab)(input)?;
150  let (input, _) = whitespace0(input)?;
151  let level: u8 = if num.len() < 3 { 3 } else { num.len() as u8 + 1 };
152  Ok((input, Subtitle{text, level}))
153}
154
155// strong := (asterisk, asterisk), +paragraph-element, (asterisk, asterisk) ;
156pub fn strong(input: ParseString) -> ParseResult<ParagraphElement> {
157  let (input, _) = tuple((asterisk,asterisk))(input)?;
158  let (input, text) = paragraph_element(input)?;
159  let (input, _) = tuple((asterisk,asterisk))(input)?;
160  Ok((input, ParagraphElement::Strong(Box::new(text))))
161}
162
163/// emphasis := asterisk, +paragraph-element, asterisk ;
164pub fn emphasis(input: ParseString) -> ParseResult<ParagraphElement> {
165  let (input, _) = asterisk(input)?;
166  let (input, text) = paragraph_element(input)?;
167  let (input, _) = asterisk(input)?;
168  Ok((input, ParagraphElement::Emphasis(Box::new(text))))
169}
170
171// strikethrough := tilde, +paragraph-element, tilde ;
172pub fn strikethrough(input: ParseString) -> ParseResult<ParagraphElement> {
173  let (input, _) = tilde(input)?;
174  let (input, text) = paragraph_element(input)?;
175  let (input, _) = tilde(input)?;
176  Ok((input, ParagraphElement::Strikethrough(Box::new(text))))
177}
178
179/// underline := underscore, +paragraph-element, underscore ;
180pub fn underline(input: ParseString) -> ParseResult<ParagraphElement> {
181  let (input, _) = underscore(input)?;
182  let (input, text) = paragraph_element(input)?;
183  let (input, _) = underscore(input)?;
184  Ok((input, ParagraphElement::Underline(Box::new(text))))
185}
186
187/// highlight := "!!", +paragraph-element, "!!" ;
188pub fn highlight(input: ParseString) -> ParseResult<ParagraphElement> {
189  let (input, _) = highlight_sigil(input)?;
190  let (input, text) = paragraph_element(input)?;
191  let (input, _) = highlight_sigil(input)?;
192  Ok((input, ParagraphElement::Highlight(Box::new(text))))
193}
194
195// inline-code := grave, +text, grave ; 
196pub fn inline_code(input: ParseString) -> ParseResult<ParagraphElement> {
197  let (input, _) = is_not(grave_codeblock_sigil)(input)?; // prevent matching code fences
198  let (input, _) = grave(input)?;
199  let (input, text) = many0(tuple((is_not(grave),text)))(input)?;
200  let (input, _) = grave(input)?;
201  let mut text = text.into_iter().map(|(_,tkn)| tkn).collect();
202  // return empty token if there's nothing between the graves
203  let mut text = match Token::merge_tokens(&mut text) {
204    Some(t) => t,
205    None => {
206      return Ok((input, ParagraphElement::InlineCode(Token::default())));
207    }
208  };
209  text.kind = TokenKind::Text;
210  Ok((input, ParagraphElement::InlineCode(text)))
211}
212
213// inline-equation := equation-sigil, +text, equation-sigil ;
214pub fn inline_equation(input: ParseString) -> ParseResult<ParagraphElement> {
215  let (input, _) = equation_sigil(input)?;
216  let (input, txt) = many0(tuple((is_not(equation_sigil),alt((backslash,text)))))(input)?;
217  let (input, _) = equation_sigil(input)?;
218  let mut txt = txt.into_iter().map(|(_,tkn)| tkn).collect();
219  let mut eqn = Token::merge_tokens(&mut txt).unwrap();
220  eqn.kind = TokenKind::Text;
221  Ok((input, ParagraphElement::InlineEquation(eqn)))
222}
223
224// hyperlink := "[", +text, "]", "(", +text, ")" ;
225pub fn hyperlink(input: ParseString) -> ParseResult<ParagraphElement> {
226  let (input, _) = left_bracket(input)?;
227  let (input, link_text) = inline_paragraph(input)?;
228  let (input, _) = right_bracket(input)?;
229  let (input, _) = left_parenthesis(input)?;
230  let (input, link) = many1(tuple((is_not(right_parenthesis),text)))(input)?;
231  let (input, _) = right_parenthesis(input)?;
232  let mut tokens = link.into_iter().map(|(_,tkn)| tkn).collect::<Vec<Token>>();
233  let link_merged = Token::merge_tokens(&mut tokens).unwrap();
234  Ok((input, ParagraphElement::Hyperlink((link_text, link_merged))))
235}
236
237// raw-hyperlink := http-prefix, +text ;
238pub fn raw_hyperlink(input: ParseString) -> ParseResult<ParagraphElement> {
239  let (input, _) = peek(http_prefix)(input)?;
240  let (input, address) = many1(tuple((is_not(space), text)))(input)?;
241  let mut tokens = address.into_iter().map(|(_,tkn)| tkn).collect::<Vec<Token>>();
242  let url_token = Token::merge_tokens(&mut tokens).unwrap();
243  let url_paragraph = Paragraph::from_tokens(vec![url_token.clone()]);
244  Ok((input, ParagraphElement::Hyperlink((url_paragraph, url_token))))
245}
246
247// option-map := "{", whitespace*, mapping*, whitespace*, "}" ;
248pub fn option_map(input: ParseString) -> ParseResult<OptionMap> {
249  let msg = "Expects right bracket '}' to terminate map.";
250  let (input, (_, r)) = range(left_brace)(input)?;
251  let (input, _) = whitespace0(input)?;
252  let (input, elements) = many1(option_mapping)(input)?;
253  let (input, _) = whitespace0(input)?;
254  let (input, _) = label!(right_brace, msg, r)(input)?;
255  Ok((input, OptionMap{elements}))
256}
257
258// option-mapping :=  whitespace*, expression, whitespace*, ":", whitespace*, expression, comma?, whitespace* ;
259pub fn option_mapping(input: ParseString) -> ParseResult<(Identifier, MechString)> {
260  let msg1 = "Unexpected space before colon ':'";
261  let msg2 = "Expects a value";
262  let msg3 = "Expects whitespace or comma followed by whitespace";
263  let msg4 = "Expects whitespace";
264  let (input, _) = whitespace0(input)?;
265  let (input, key) = identifier(input)?;
266  let (input, _) = whitespace0(input)?;
267  let (input, _) = colon(input)?;
268  let (input, _) = whitespace0(input)?;
269  let (input, value) = string(input)?;
270  let (input, _) = whitespace0(input)?;
271  let (input, _) = opt(comma)(input)?;
272  let (input, _) = whitespace0(input)?;
273  Ok((input, (key, value)))
274}
275
276// img := "![", *text, "]", "(", +text, ")" , ?option-map ;
277pub fn img(input: ParseString) -> ParseResult<Image> {
278  let (input, _) = img_prefix(input)?;
279  let (input, caption_text) = opt(inline_paragraph)(input)?;
280  let (input, _) = right_bracket(input)?;
281  let (input, _) = left_parenthesis(input)?;
282  let (input, src) = many1(tuple((is_not(right_parenthesis),text)))(input)?;
283  let (input, _) = right_parenthesis(input)?;
284  let (input, style) = opt(option_map)(input)?;
285  let merged_src = Token::merge_tokens(&mut src.into_iter().map(|(_,tkn)| tkn).collect::<Vec<Token>>()).unwrap();
286  Ok((input, Image{src: merged_src, caption: caption_text, style}))
287}
288
289// paragraph-text := ¬(img-prefix | http-prefix | left-bracket | tilde | asterisk | underscore | grave | define-operator | bar), +text ;
290pub fn paragraph_text(input: ParseString) -> ParseResult<ParagraphElement> {
291  let (input, elements) = match many1(nom_tuple((is_not(alt((section_sigil, footnote_prefix, highlight_sigil, equation_sigil, img_prefix, http_prefix, left_brace, left_bracket, left_angle, right_bracket, tilde, asterisk, underscore, grave, define_operator, bar, mika_section_open, mika_section_close))),text)))(input) {
292    Ok((input, mut text)) => {
293      let mut text = text.into_iter().map(|(_,tkn)| tkn).collect();
294      let mut text = Token::merge_tokens(&mut text).unwrap();
295      text.kind = TokenKind::Text;
296      (input, ParagraphElement::Text(text))
297    }, 
298    Err(err) => {return Err(err);},
299  };
300  Ok((input, elements))
301}
302
303// eval-inline-mech-code := "{", ws0, expression, ws0, "}" ;`
304pub fn eval_inline_mech_code(input: ParseString) -> ParseResult<ParagraphElement> {
305  let (input, _) = left_brace(input)?;
306  let (input, _) = whitespace0(input)?;
307  let (input, expr) = expression(input)?;
308  let (input, _) = whitespace0(input)?;
309  let (input, _) = right_brace(input)?;
310  Ok((input, ParagraphElement::EvalInlineMechCode(expr)))
311}
312
313// inline-mech-code := "{{", ws0, expression, ws0, "}}" ;`
314pub fn inline_mech_code(input: ParseString) -> ParseResult<ParagraphElement> {
315  let (input, _) = left_brace(input)?;
316  let (input, _) = left_brace(input)?;
317  let (input, _) = whitespace0(input)?;
318  let (input, expr) = mech_code_alt(input)?;
319  let (input, _) = whitespace0(input)?;
320  let (input, _) = right_brace(input)?;
321  let (input, _) = right_brace(input)?;
322  Ok((input, ParagraphElement::InlineMechCode(expr)))
323}
324
325// footnote-reference := "[^", +text, "]" ;
326pub fn footnote_reference(input: ParseString) -> ParseResult<ParagraphElement> {
327  let (input, _) = footnote_prefix(input)?;
328  let (input, text) = many1(tuple((is_not(right_bracket),text)))(input)?;
329  let (input, _) = right_bracket(input)?;
330  let mut tokens = text.into_iter().map(|(_,tkn)| tkn).collect::<Vec<Token>>();
331  let footnote_text = Token::merge_tokens(&mut tokens).unwrap();
332  Ok((input, ParagraphElement::FootnoteReference(footnote_text)))
333}
334
335// reference := "[", +alphanumeric, "]" ;
336pub fn reference(input: ParseString) -> ParseResult<ParagraphElement> {
337  let (input, _) = left_bracket(input)?;
338  let (input, mut txt) = many1(alphanumeric)(input)?;
339  let (input, _) = right_bracket(input)?;
340  let ref_text = Token::merge_tokens(&mut txt).unwrap();
341  Ok((input, ParagraphElement::Reference(ref_text)))
342}
343
344// section_ref := "§" , +(alphanumeric | period) ;
345pub fn section_reference(input: ParseString) -> ParseResult<ParagraphElement> {
346  let (input, _) = section_sigil(input)?;
347  let (input, mut txt) = many1(alt((alphanumeric, period)))(input)?;
348  let section_text = Token::merge_tokens(&mut txt).unwrap();
349  Ok((input, ParagraphElement::SectionReference(section_text)))
350}
351
352// paragraph-element := hyperlink | reference | section-ref | raw-hyperlink | highlight | footnote-reference | inline-mech-code | eval-inline-mech-code | inline-equation | paragraph-text | strong | highlight | emphasis | inline-code | strikethrough | underline ;
353pub fn paragraph_element(input: ParseString) -> ParseResult<ParagraphElement> {
354  alt((hyperlink, reference, section_reference, raw_hyperlink, highlight, footnote_reference, inline_mech_code, eval_inline_mech_code, inline_equation, paragraph_text, strong, highlight, emphasis, inline_code, strikethrough, underline))(input)
355}
356
357// paragraph := +paragraph_element ;
358pub fn inline_paragraph(input: ParseString) -> ParseResult<Paragraph> {
359  let (input, _) = peek(paragraph_element)(input)?;
360  let (input, elements) = many1(
361    pair(
362      is_not(new_line),
363      paragraph_element
364    )
365  )(input)?;
366  let elements = elements.into_iter().map(|(_,elem)| elem).collect();
367  Ok((input, Paragraph{elements, error_range: None}))
368}
369
370// paragraph := +paragraph_element ;
371pub fn paragraph(input: ParseString) -> ParseResult<Paragraph> {
372  let (input, _) = peek(paragraph_element)(input)?;
373  let (input, elements) = many1(
374    pair(
375      is_not(alt((null(new_line), null(mika_section_close), null(idea_sigil)))),
376      labelr!(paragraph_element, 
377              |input| recover::<ParagraphElement, _>(input, skip_till_paragraph_element),
378              "Unexpected paragraph element")
379    )
380  )(input)?;
381  let elements = elements.into_iter().map(|(_,elem)| elem).collect();
382  Ok((input, Paragraph{elements, error_range: None}))
383}
384
385// paragraph-newline := +paragraph_element, new_line ;
386pub fn paragraph_newline(input: ParseString) -> ParseResult<Paragraph> {
387  let (input, elements) = paragraph(input)?;
388  let (input, _) = new_line(input)?;
389  Ok((input, elements))
390}
391
392// indented-ordered-list-item := ws, number, ".", +text, new_line*; 
393pub fn ordered_list_item(input: ParseString) -> ParseResult<(Number,Paragraph)> {
394  let (input, number) = number(input)?;
395  let (input, _) = period(input)?;
396  let (input, list_item) = labelr!(paragraph_newline, |input| recover::<Paragraph, _>(input, skip_till_eol), "Expects paragraph as list item")(input)?;
397  Ok((input, (number,list_item)))
398}
399
400// checked-item := "-", ("[", "x", "]"), paragraph ;
401pub fn checked_item(input: ParseString) -> ParseResult<(bool,Paragraph)> {
402  let (input, _) = dash(input)?;
403  let (input, _) = left_bracket(input)?;
404  let (input, _) = alt((tag("x"),tag("✓"),tag("✗")))(input)?;
405  let (input, _) = right_bracket(input)?;
406  let (input, list_item) = labelr!(paragraph_newline, |input| recover::<Paragraph, _>(input, skip_till_eol), "Expects paragraph as list item")(input)?;
407  Ok((input, (true,list_item)))
408}
409
410// unchecked-item := "-", ("[", whitespace0, "]"), paragraph ;
411pub fn unchecked_item(input: ParseString) -> ParseResult<(bool,Paragraph)> {
412  let (input, _) = dash(input)?;
413  let (input, _) = left_bracket(input)?;
414  let (input, _) = whitespace0(input)?;
415  let (input, _) = right_bracket(input)?;
416  let (input, list_item) = labelr!(paragraph_newline, |input| recover::<Paragraph, _>(input, skip_till_eol), "Expects paragraph as list item")(input)?;
417  Ok((input, (false,list_item)))
418}
419
420// check-list-item := checked-item | unchecked-item ;
421pub fn check_list_item(input: ParseString) -> ParseResult<(bool,Paragraph)> {
422  let (input, item) = alt((checked_item, unchecked_item))(input)?;
423  Ok((input, item))
424}
425
426pub fn check_list(mut input: ParseString, level: usize) -> ParseResult<MDList> {
427  let mut items = vec![];
428  loop {
429    // Calculate current line indent
430    let mut indent = 0;
431    let mut current = input.peek(indent);
432    while current == Some(" ") || current == Some("\t") {
433      indent += 1;
434      current = input.peek(indent);
435    }
436    // If indent is less than current level, we are done parsing this list level
437    if indent < level {
438      break;
439    }
440    // Consume whitespace
441    let (next_input, _) = many0(space_tab)(input.clone())?;
442    // Try parsing a checklist item
443    let (next_input, list_item) = match check_list_item(next_input.clone()) {
444      Ok((next_input, list_item)) => (next_input, list_item),
445      Err(err) => {
446        if !items.is_empty() {
447          break;
448        } else {
449          return Err(err);
450        }
451      }
452    };
453    // Look ahead to next line's indent
454    let mut lookahead_indent = 0;
455    let mut current = next_input.peek(lookahead_indent);
456    while current == Some(" ") || current == Some("\t") {
457      lookahead_indent += 1;
458      current = next_input.peek(lookahead_indent);
459    }
460    input = next_input;
461    if lookahead_indent < level {
462      // End of this list level
463      items.push((list_item, None));
464      break;
465    } else if lookahead_indent == level {
466      // Same level, continue
467      items.push((list_item, None));
468      continue;
469    } else {
470      // Nested sublist: parse recursively
471      let (next_input, sublist_md) = sublist(input.clone(), lookahead_indent)?;
472      items.push((list_item, Some(sublist_md)));
473      input = next_input;
474    }
475  }
476  Ok((input, MDList::Check(items)))
477}
478
479
480// unordered_list := +list_item, ?new_line, *whitespace ;
481pub fn unordered_list(mut input: ParseString, level: usize) -> ParseResult<MDList> {
482  let mut items = vec![];
483  loop {
484    let mut indent = 0;
485    let mut current = input.peek(indent);
486    while current == Some(" ") || current == Some("\t") {
487      indent += 1;
488      current = input.peek(indent);
489    }
490    // If indentation is less than the current level, return to parent list
491    if indent < level {
492      return Ok((input, MDList::Unordered(items)));
493    }
494    let (next_input, _) = many0(space_tab)(input.clone())?;
495    // Try to parse a list item
496    let (next_input, list_item) = match unordered_list_item(next_input.clone()) {
497      Ok((next_input, list_item)) => (next_input, list_item),
498      Err(err) => {
499        if !items.is_empty() {
500          return Ok((input, MDList::Unordered(items)));
501        } else {
502          return Err(err);
503        }
504      }
505    };
506    // Look ahead at the next line to determine indent
507    let mut lookahead_indent = 0;
508    let mut current = next_input.peek(lookahead_indent);
509    while current == Some(" ") || current == Some("\t") {
510      lookahead_indent += 1;
511      current = next_input.peek(lookahead_indent);
512    }
513    input = next_input;
514    if lookahead_indent < level {
515      // This is the last item at the current list level
516      items.push((list_item, None));
517      return Ok((input, MDList::Unordered(items)));
518    } else if lookahead_indent == level {
519      // Continue at the same level
520      items.push((list_item, None));
521      continue;
522    } else {
523      // Nested list detected
524      let (next_input, sub) = sublist(input.clone(), lookahead_indent)?;
525      items.push((list_item, Some(sub)));
526      input = next_input;
527    }
528  }
529}
530
531// ordered-list := +ordered-list-item, ?new-line, *whitespace ;
532pub fn ordered_list(mut input: ParseString, level: usize) -> ParseResult<MDList> {
533  let mut items = vec![];
534  loop {
535    let mut indent = 0;
536    let mut current = input.peek(indent);
537    while current == Some(" ") || current == Some("\t") {
538      indent += 1;
539      current = input.peek(indent);
540    }
541    // If indent drops below current level, return to parent
542    if indent < level {
543      let start = items.first()
544        .map(|item: &((Number, Paragraph), Option<MDList>)| item.0.0.clone())
545        .unwrap_or(Number::from_integer(1));
546      return Ok((input, MDList::Ordered(OrderedList { start, items })));
547    }
548    // Consume whitespace
549    let (next_input, _) = many0(space_tab)(input.clone())?;
550    // Try to parse an ordered list item
551    let (next_input, (list_item, _)) = match tuple((ordered_list_item, is_not(tuple((dash, dash)))))(next_input.clone()) {
552      Ok((next_input, res)) => (next_input, res),
553      Err(err) => {
554        if !items.is_empty() {
555          let start = items.first()
556            .map(|((number, _), _)| number.clone())
557            .unwrap_or(Number::from_integer(1));
558          return Ok((input, MDList::Ordered(OrderedList { start, items })));
559        } else {
560          return Err(err);
561        }
562      }
563    };
564
565    // Determine indentation of the next line
566    let mut lookahead_indent = 0;
567    let mut current = next_input.peek(lookahead_indent);
568    while current == Some(" ") || current == Some("\t") {
569      lookahead_indent += 1;
570      current = next_input.peek(lookahead_indent);
571    }
572
573    input = next_input;
574
575    if lookahead_indent < level {
576      items.push((list_item, None));
577      let start = items.first()
578        .map(|((number, _), _)| number.clone())
579        .unwrap_or(Number::from_integer(1));
580      return Ok((input, MDList::Ordered(OrderedList { start, items })));
581    } else if lookahead_indent == level {
582      items.push((list_item, None));
583      continue;
584    } else {
585      // Nested sublist
586      let (next_input, sub) = sublist(input.clone(), lookahead_indent)?;
587      items.push((list_item, Some(sub)));
588      input = next_input;
589    }
590  }
591}
592
593
594
595pub fn sublist(input: ParseString, level: usize) -> ParseResult<MDList> {
596  let (input, list) = match ordered_list(input.clone(), level) {
597    Ok((input, list)) => (input, list),
598    _ => match check_list(input.clone(), level) {
599      Ok((input, list)) => (input, list),
600      _ => match unordered_list(input.clone(), level) {
601        Ok((input, list)) => (input, list),
602        Err(err) => { return Err(err); }
603      }
604    }
605  };
606  Ok((input, list))
607}
608
609// mechdown-list := ordered-list | unordered-list ;
610pub fn mechdown_list(input: ParseString) -> ParseResult<MDList> {
611  let (input, list) = match ordered_list(input.clone(), 0) {
612    Ok((input, list)) => (input, list),
613    _ => match check_list(input.clone(), 0) {
614      Ok((input, list)) => (input, list),
615      _ => match unordered_list(input.clone(), 0) {
616        Ok((input, list)) => (input, list),
617        Err(err) => { return Err(err); }
618      }
619    }
620  };
621  Ok((input, list))
622}
623
624// list_item := dash, <space+>, <paragraph>, new_line* ;
625pub fn unordered_list_item(input: ParseString) -> ParseResult<(Option<Token>,Paragraph)> {
626  let msg1 = "Expects space after dash";
627  let msg2 = "Expects paragraph as list item";
628  let (input, _) = dash(input)?;
629  let (input, bullet) = opt(tuple((left_parenthesis, emoji, right_parenthesis)))(input)?;
630  let (input, _) = labelr!(null(many1(space)), skip_nil, msg1)(input)?;
631  let (input, list_item) = labelr!(paragraph_newline, |input| recover::<Paragraph, _>(input, skip_till_eol), msg2)(input)?;
632  let (input, _) = many0(new_line)(input)?;
633  let bullet = match bullet {
634    Some((_,b,_)) => Some(b),
635    None => None,
636  };
637  Ok((input,  (bullet, list_item)))
638}
639
640// codeblock-sigil := "```" | "~~~" ;
641pub fn codeblock_sigil(input: ParseString) -> ParseResult<fn(ParseString) -> ParseResult<Token>> {
642  let (input, sgl_tkn) = alt((grave_codeblock_sigil, tilde_codeblock_sigil))(input)?;
643  let sgl_cmb = match sgl_tkn.kind {
644    TokenKind::GraveCodeBlockSigil => grave_codeblock_sigil,
645    TokenKind::TildeCodeBlockSigil => tilde_codeblock_sigil,
646    _ => unreachable!(),
647  };
648  Ok((input, sgl_cmb))
649}
650
651//
652pub fn code_block(input: ParseString) -> ParseResult<SectionElement> {
653  let msg1 = "Expects 3 graves to start a code block";
654  let msg2 = "Expects new_line";
655  let msg3 = "Expects 3 graves followed by new_line to terminate a code block";
656  let (input, (end_sgl,r)) = range(codeblock_sigil)(input)?;
657  let (input, _) = many0(space_tab)(input)?;
658  let (input, code_id) = many0(tuple((is_not(left_brace),text)))(input)?;
659  let code_id = code_id.into_iter().map(|(_,tkn)| tkn).collect::<Vec<Token>>();
660  let (input, options) = opt(option_map)(input)?;
661  let (input, _) = many0(space_tab)(input)?;
662  let (input, _) = label!(new_line, msg2)(input)?;
663  let (input, (text,src_range)) = range(many0(nom_tuple((
664    is_not(end_sgl),
665    any,
666  ))))(input)?;
667  let (input, _) = end_sgl(input)?;
668  let (input, _) = whitespace0(input)?;
669  let block_src: Vec<char> = text.into_iter().flat_map(|(_, s)| s.chars().collect::<Vec<char>>()).collect();
670  let code_token = Token::new(TokenKind::CodeBlock, src_range, block_src.clone());
671
672  let code_id = code_id.iter().flat_map(|tkn| tkn.chars.clone().into_iter().collect::<Vec<char>>()).collect::<String>();
673  match code_id.as_str() {
674    "ebnf" => {
675      let ebnf_text = block_src.iter().collect::<String>();
676      match parse_grammar(&ebnf_text) {
677        Ok(grammar_tree) => {return Ok((input, SectionElement::Grammar(grammar_tree)));},
678        Err(err) => {
679          println!("Error parsing EBNF grammar: {:?}", err);
680          todo!();
681        }
682      }
683    }
684    tag => {
685      // if x begins with mec, mech, or 🤖
686      if tag.starts_with("mech") || tag.starts_with("mec") || tag.starts_with("🤖") {
687
688        // get rid of the prefix and then treat the rest of the string after : as an identifier
689        let rest = tag.trim_start_matches("mech").trim_start_matches("mec").trim_start_matches("🤖").trim_start_matches(":");
690        
691        let config = if rest == "" {BlockConfig { namespace_str: "".to_string(), namespace: 0, disabled: false, hidden: false}}
692        else if rest == "disabled" { BlockConfig { namespace_str: "".to_string(), namespace: 0, disabled: true, hidden: false} }
693        else if rest == "hidden" { BlockConfig { namespace_str: "".to_string(), namespace: 0, disabled: false, hidden: true} }
694        else { BlockConfig { namespace_str: rest.to_string(), namespace: hash_str(rest), disabled: false, hidden: false} };
695
696        let mech_src = block_src.iter().collect::<String>();
697        let graphemes = graphemes::init_source(&mech_src);
698        let parse_string = ParseString::new(&graphemes);
699
700        match mech_code(parse_string) {
701          Ok((_, mech_tree)) => {
702            // TODO what if not all the input is parsed? Is that handled?
703            return Ok((input, SectionElement::FencedMechCode(FencedMechCode{code: mech_tree, config, options})));
704          },
705          Err(err) => {
706            return Err(nom::Err::Error(ParseError {
707                cause_range: SourceRange::default(),
708                remaining_input: input,
709                error_detail: ParseErrorDetail {
710                    message: "Generic error parsing Mech code block",
711                    annotation_rngs: Vec::new(),
712                },
713            }));
714          }
715        };
716      } else if tag.starts_with("equation") || tag.starts_with("eq") || tag.starts_with("math") || tag.starts_with("latex") || tag.starts_with("tex") {
717          return Ok((input, SectionElement::Equation(code_token)));
718      } else if tag.starts_with("diagram") || tag.starts_with("chart") || tag.starts_with("mermaid") {
719          return Ok((input, SectionElement::Diagram(code_token)));          
720      } else {
721        // Some other code block, just keep moving although we might want to do something with it later
722      }
723    }
724  } 
725  Ok((input, SectionElement::CodeBlock(code_token)))
726}
727
728pub fn thematic_break(input: ParseString) -> ParseResult<SectionElement> {
729  let (input, _) = many1(asterisk)(input)?;
730  let (input, _) = many0(space_tab)(input)?;
731  let (input, _) = new_line(input)?;
732  Ok((input, SectionElement::ThematicBreak))
733}
734
735// footnote := "[^", +text, "]", ":", ws0, paragraph ;
736pub fn footnote(input: ParseString) -> ParseResult<Footnote> {
737  let (input, _) = footnote_prefix(input)?;
738  let (input, text) = many1(tuple((is_not(right_bracket),text)))(input)?;
739  let (input, _) = right_bracket(input)?;
740  let (input, _) = colon(input)?;
741  let (input, _) = whitespace0(input)?;
742  let (input, paragraph) = many1(paragraph_newline)(input)?;
743  let mut tokens = text.into_iter().map(|(_,tkn)| tkn).collect::<Vec<Token>>();
744  let footnote_text = Token::merge_tokens(&mut tokens).unwrap();
745  let footnote = (footnote_text, paragraph);
746  Ok((input, footnote))
747}
748
749// prompt := prompt-sigil, *space, +paragraph ;
750pub fn prompt(input: ParseString) -> ParseResult<SectionElement> {
751  let (input, _) = prompt_sigil(input)?;
752  let (input, _) = many0(space_tab)(input)?;
753  let (input, element) = section_element(input)?;
754  Ok((input, SectionElement::Prompt(Box::new(element))))
755}
756
757pub fn blank_line(input: ParseString) -> ParseResult<Vec<Token>> {
758  let (input, mut st) = many0(space_tab)(input)?;
759  let (input, n) = new_line(input)?;
760  st.push(n);
761  Ok((input, st))
762}
763
764// question-block := question-sigil, *space, +paragraph ;
765pub fn question_block(input: ParseString) -> ParseResult<SectionElement> {
766  let (input, _) = question_sigil(input)?;
767  let (input, _) = many0(space_tab)(input)?;
768  let (input, paragraphs) = many1(paragraph_newline)(input)?;
769  Ok((input, SectionElement::QuestionBlock(paragraphs)))
770}
771
772// info-block := info-sigil, *space, +paragraph ;
773pub fn info_block(input: ParseString) -> ParseResult<SectionElement> {
774  let (input, _) = info_sigil(input)?;
775  let (input, _) = many0(space_tab)(input)?;
776  let (input, paragraphs) = many1(paragraph_newline)(input)?;
777  Ok((input, SectionElement::InfoBlock(paragraphs)))
778}
779
780// quote-block := quote-sigil, *space, +paragraph ;
781pub fn quote_block(input: ParseString) -> ParseResult<SectionElement> {
782  let (input, _) = peek(is_not(float_sigil))(input)?;
783  let (input, _) = peek(is_not(prompt_sigil))(input)?;
784  let (input, _) = quote_sigil(input)?;
785  let (input, _) = many0(space_tab)(input)?;
786  let (input, paragraphs) = many1(paragraph_newline)(input)?;
787  Ok((input, SectionElement::QuoteBlock(paragraphs)))
788}
789
790// warning-block := warning-sigil, *space, +paragraph ;
791pub fn warning_block(input: ParseString) -> ParseResult<SectionElement> {
792  let (input, _) = peek(is_not(float_sigil))(input)?;
793  let (input, _) = warning_sigil(input)?;
794  let (input, _) = many0(space_tab)(input)?;
795  let (input, paragraphs) = many1(paragraph_newline)(input)?;
796  Ok((input, SectionElement::WarningBlock(paragraphs)))
797}
798
799// success-block := success-sigil, *space, +paragraph ;
800pub fn success_block(input: ParseString) -> ParseResult<SectionElement> {
801  let (input, _) = peek(is_not(float_sigil))(input)?;
802  let (input, _) = alt((success_sigil, success_check_sigil))(input)?;
803  let (input, _) = many0(space_tab)(input)?;
804  let (input, paragraphs) = many1(paragraph_newline)(input)?;
805  Ok((input, SectionElement::SuccessBlock(paragraphs)))
806}
807
808// error-block := error-sigil, *space, +paragraph ;
809pub fn error_block(input: ParseString) -> ParseResult<SectionElement> {
810  let (input, _) = peek(is_not(float_sigil))(input)?;
811  let (input, _) = alt((error_sigil, error_alt_sigil))(input)?;
812  let (input, _) = many0(space_tab)(input)?;
813  let (input, paragraphs) = many1(paragraph_newline)(input)?;
814  Ok((input, SectionElement::ErrorBlock(paragraphs)))
815}
816
817// idea-block := idea-sigil, *space, +paragraph ;
818pub fn idea_block(input: ParseString) -> ParseResult<SectionElement> {
819  let (input, _) = idea_sigil(input)?;
820  let (input, _) = many0(space_tab)(input)?;
821  let (input, paragraphs) = many1(paragraph_newline)(input)?;
822  Ok((input, SectionElement::IdeaBlock(paragraphs)))
823}
824
825// abstract-element := abstract-sigil, *space, +paragraph ;
826pub fn abstract_el(input: ParseString) -> ParseResult<SectionElement> {
827  let (input, _) = abstract_sigil(input)?;
828  let (input, _) = many0(space_tab)(input)?;
829  let (input, paragraphs) = many1(paragraph_newline)(input)?;
830  Ok((input, SectionElement::Abstract(paragraphs)))
831}
832
833// equation := "$$" , +text ;
834pub fn equation(input: ParseString) -> ParseResult<Token> {
835  let (input, _) = equation_sigil(input)?;
836  let (input, mut txt) = many1(alt((backslash,text)))(input)?;
837  let mut eqn = Token::merge_tokens(&mut txt).unwrap();
838  Ok((input, eqn))
839}
840
841// citation := "[", (identifier | number), "]", ":", ws0, paragraph, ws0, ?("(", +text, ")") ;
842pub fn citation(input: ParseString) -> ParseResult<Citation> {
843  let (input, _) = left_bracket(input)?;
844  let (input, mut id) = many1(alphanumeric)(input)?;
845  let (input, _) = right_bracket(input)?;
846  let (input, _) = colon(input)?;
847  let (input, _) = whitespace0(input)?;
848  let (input, txt) = paragraph(input)?;
849  let (input, _) = whitespace0(input)?;
850  let id = Token::merge_tokens(&mut id).unwrap();
851  Ok((input, Citation{id, text: txt}))
852}
853
854// float-sigil := ">>" | "<<" ;
855pub fn float_sigil(input: ParseString) -> ParseResult<FloatDirection> {
856  let (input, d) = alt((float_left, float_right))(input)?;
857  let d = match d.kind {
858    TokenKind::FloatLeft => FloatDirection::Left,
859    TokenKind::FloatRight => FloatDirection::Right,
860    _ => unreachable!(),
861  };
862  Ok((input, d))
863}
864
865// float := float-sigil, section-element ;
866pub fn float(input: ParseString) -> ParseResult<(Box<SectionElement>,FloatDirection)> {
867  let (input, direction) = float_sigil(input)?;
868  let (input, _) = many0(space_tab)(input)?;
869  let (input, el) = section_element(input)?;
870  Ok((input, (Box::new(el), direction)))
871}
872
873// float := float-sigil, section-element ;
874pub fn not_mech_code(input: ParseString) -> ParseResult<()> {
875  let (input, _) = alt((null(question_block), 
876    null(info_block),  
877    null(success_block),
878    null(warning_block),
879    null(error_block),
880    null(idea_block),
881    null(img), 
882    null(mika_section_close),
883    null(float)))(input)?;
884  Ok((input, ()))
885}
886
887// section-element := mech-code | question-block | info-block | list | footnote | citation | abstract-element | img | equation | table | float | quote-block | code-block | thematic-break | subtitle | paragraph ;
888pub fn section_element(input: ParseString) -> ParseResult<SectionElement> {
889  let parsers: Vec<(&'static str, Box<dyn Fn(ParseString) -> ParseResult<SectionElement>>)> = vec![
890    ("list",            Box::new(|i| mechdown_list(i).map(|(i, lst)| (i, SectionElement::List(lst))))),
891    ("prompt",          Box::new(prompt)),
892    ("footnote",        Box::new(|i| footnote(i).map(|(i, f)| (i, SectionElement::Footnote(f))))),
893    ("citation",        Box::new(|i| citation(i).map(|(i, c)| (i, SectionElement::Citation(c))))),
894    ("abstract",        Box::new(abstract_el)),
895    ("img",             Box::new(|i| img(i).map(|(i, img)| (i, SectionElement::Image(img))))),
896    ("equation",        Box::new(|i| equation(i).map(|(i, e)| (i, SectionElement::Equation(e))))),
897    ("table",           Box::new(|i| mechdown_table(i).map(|(i, t)| (i, SectionElement::Table(t))))),
898    ("float",           Box::new(|i| float(i).map(|(i, f)| (i, SectionElement::Float(f))))),
899    //("quote_block",     Box::new(quote_block)),
900    ("code_block",      Box::new(code_block)),
901    ("thematic_break",  Box::new(|i| thematic_break(i).map(|(i, _)| (i, SectionElement::ThematicBreak)))),
902    ("subtitle",        Box::new(|i| subtitle(i).map(|(i, s)| (i, SectionElement::Subtitle(s))))),
903    ("question_block",  Box::new(question_block)),
904    ("info_block",      Box::new(info_block)),
905    ("success_block",   Box::new(success_block)),
906    ("warning_block",   Box::new(warning_block)),
907    ("error_block",     Box::new(error_block)),
908    ("idea_block",      Box::new(idea_block)),
909    ("paragraph",       Box::new(|i| paragraph(i).map(|(i, p)| (i, SectionElement::Paragraph(p))))),
910  ];
911
912  alt_best(input, &parsers)
913  
914}
915
916// section := ?ul-subtitle, +section-element ;
917pub fn section(input: ParseString) -> ParseResult<Section> {
918  let (input, subtitle) = opt(ul_subtitle)(input)?;
919
920  let mut elements = vec![];
921
922  let mut new_input = input.clone();
923
924  loop {
925    // Stop if EOF reached
926    if new_input.cursor >= new_input.graphemes.len() {
927      //println!("EOF reached while parsing section");
928      break;
929    }
930
931    // Stop if the next thing is a new section (peek, do not consume)
932    if ul_subtitle(new_input.clone()).is_ok() {
933      //println!("Next section detected, ending current section");
934      break;
935    }
936
937    #[cfg(feature = "mika")]
938    if mika_section_close(new_input.clone()).is_ok() {
939      break;
940    }
941
942    /*let (input, sct_elmnt) = labelr!(
943      section_element,
944      |input| recover::<SectionElement, _>(input, skip_till_eol),
945      "Expected a section element."
946    )(input.clone())?;*/
947
948    //elements.push(sct_elmnt);
949    //let (input, _) = many0(blank_line)(input.clone())?;
950
951    #[cfg(feature = "mika")]
952    match mika(new_input.clone()) {
953      Ok((input, mika)) => {
954        elements.push(SectionElement::Mika(mika));
955        new_input = input;
956        continue;
957      }
958      Err(e) => {
959        // not mika code, try mech code
960        //return Err(e);
961      }
962    }
963  
964    // check if it's mech_code first, we'll prioritize that
965    match mech_code(new_input.clone()) {
966      Ok((input, mech_tree)) => {
967        elements.push(SectionElement::MechCode(mech_tree));
968        new_input = input;
969        continue;
970      }
971      Err(e) => {
972        // not mech code, try section_element
973        //return Err(e);
974      }
975    }
976
977    match section_element(new_input.clone()) {
978      Ok((input, element)) => {
979
980        elements.push(element);
981
982        // Skip any blank lines after the element
983        let (input, _) = many0(blank_line)(input.clone())?;
984        new_input = input;
985      }
986      Err(err) => {
987        // Propagate hard errors
988        return Err(err);
989      }
990    }
991  }
992  Ok((new_input, Section { subtitle, elements }))
993}
994
995// body := whitespace0, +(section, eof), eof ;
996pub fn body(input: ParseString) -> ParseResult<Body> {
997  let (mut input, _) = whitespace0(input)?;
998  let mut sections = vec![];
999  let mut new_input = input.clone();
1000  loop {
1001    if new_input.cursor >= new_input.graphemes.len() {
1002      break;
1003    }
1004    // Try parsing a section
1005    match section(new_input.clone()) {
1006      Ok((input, sect)) => {
1007        //println!("Parsed section: {:#?}", sect);
1008        sections.push(sect);
1009        new_input = input;
1010      }
1011      Err(err) => {
1012        return Err(err);
1013      }
1014    }
1015  }
1016  Ok((new_input, Body { sections }))
1017}