nu_parser/
flatten.rs

1use nu_protocol::{
2    DeclId, GetSpan, Span, SyntaxShape, VarId,
3    ast::{
4        Argument, Block, Expr, Expression, ExternalArgument, ImportPatternMember, ListItem,
5        MatchPattern, PathMember, Pattern, Pipeline, PipelineElement, PipelineRedirection,
6        RecordItem,
7    },
8    engine::StateWorkingSet,
9};
10use std::fmt::{Display, Formatter, Result};
11
12#[derive(Debug, Eq, PartialEq, Ord, Clone, PartialOrd)]
13pub enum FlatShape {
14    Binary,
15    Block,
16    Bool,
17    Closure,
18    Custom(DeclId),
19    DateTime,
20    Directory,
21    // The stored span contains the name of the called external command:
22    // This is only different from the span containing the call's head if this
23    // call is through an alias, and is only useful for its contents (not its location).
24    External(Box<Span>),
25    ExternalArg,
26    ExternalResolved,
27    Filepath,
28    Flag,
29    Float,
30    Garbage,
31    GlobInterpolation,
32    GlobPattern,
33    Int,
34    InternalCall(DeclId),
35    Keyword,
36    List,
37    Literal,
38    MatchPattern,
39    Nothing,
40    Operator,
41    Pipe,
42    Range,
43    RawString,
44    Record,
45    Redirection,
46    Signature,
47    String,
48    StringInterpolation,
49    Table,
50    Variable(VarId),
51    VarDecl(VarId),
52}
53
54impl FlatShape {
55    pub fn as_str(&self) -> &str {
56        match self {
57            FlatShape::Binary => "shape_binary",
58            FlatShape::Block => "shape_block",
59            FlatShape::Bool => "shape_bool",
60            FlatShape::Closure => "shape_closure",
61            FlatShape::Custom(_) => "shape_custom",
62            FlatShape::DateTime => "shape_datetime",
63            FlatShape::Directory => "shape_directory",
64            FlatShape::External(_) => "shape_external",
65            FlatShape::ExternalArg => "shape_externalarg",
66            FlatShape::ExternalResolved => "shape_external_resolved",
67            FlatShape::Filepath => "shape_filepath",
68            FlatShape::Flag => "shape_flag",
69            FlatShape::Float => "shape_float",
70            FlatShape::Garbage => "shape_garbage",
71            FlatShape::GlobInterpolation => "shape_glob_interpolation",
72            FlatShape::GlobPattern => "shape_globpattern",
73            FlatShape::Int => "shape_int",
74            FlatShape::InternalCall(_) => "shape_internalcall",
75            FlatShape::Keyword => "shape_keyword",
76            FlatShape::List => "shape_list",
77            FlatShape::Literal => "shape_literal",
78            FlatShape::MatchPattern => "shape_match_pattern",
79            FlatShape::Nothing => "shape_nothing",
80            FlatShape::Operator => "shape_operator",
81            FlatShape::Pipe => "shape_pipe",
82            FlatShape::Range => "shape_range",
83            FlatShape::RawString => "shape_raw_string",
84            FlatShape::Record => "shape_record",
85            FlatShape::Redirection => "shape_redirection",
86            FlatShape::Signature => "shape_signature",
87            FlatShape::String => "shape_string",
88            FlatShape::StringInterpolation => "shape_string_interpolation",
89            FlatShape::Table => "shape_table",
90            FlatShape::Variable(_) => "shape_variable",
91            FlatShape::VarDecl(_) => "shape_vardecl",
92        }
93    }
94}
95
96impl Display for FlatShape {
97    fn fmt(&self, f: &mut Formatter) -> Result {
98        f.write_str(self.as_str())
99    }
100}
101
102/*
103The `_into` functions below (e.g., `flatten_block_into`) take an existing `output` `Vec`
104and append more data to it. This is to reduce the number of intermediate `Vec`s.
105The non-`into` functions (e.g., `flatten_block`) are part of the crate's public API
106and return a new `Vec` instead of modifying an existing one.
107*/
108
109fn flatten_block_into(
110    working_set: &StateWorkingSet,
111    block: &Block,
112    output: &mut Vec<(Span, FlatShape)>,
113) {
114    for pipeline in &block.pipelines {
115        flatten_pipeline_into(working_set, pipeline, output);
116    }
117}
118
119fn flatten_pipeline_into(
120    working_set: &StateWorkingSet,
121    pipeline: &Pipeline,
122    output: &mut Vec<(Span, FlatShape)>,
123) {
124    for expr in &pipeline.elements {
125        flatten_pipeline_element_into(working_set, expr, output)
126    }
127}
128
129fn flatten_pipeline_element_into(
130    working_set: &StateWorkingSet,
131    pipeline_element: &PipelineElement,
132    output: &mut Vec<(Span, FlatShape)>,
133) {
134    if let Some(span) = pipeline_element.pipe {
135        output.push((span, FlatShape::Pipe));
136    }
137
138    flatten_expression_into(working_set, &pipeline_element.expr, output);
139
140    if let Some(redirection) = pipeline_element.redirection.as_ref() {
141        match redirection {
142            PipelineRedirection::Single { target, .. } => {
143                output.push((target.span(), FlatShape::Redirection));
144                if let Some(expr) = target.expr() {
145                    flatten_expression_into(working_set, expr, output);
146                }
147            }
148            PipelineRedirection::Separate { out, err } => {
149                let (out, err) = if out.span() <= err.span() {
150                    (out, err)
151                } else {
152                    (err, out)
153                };
154
155                output.push((out.span(), FlatShape::Redirection));
156                if let Some(expr) = out.expr() {
157                    flatten_expression_into(working_set, expr, output);
158                }
159                output.push((err.span(), FlatShape::Redirection));
160                if let Some(expr) = err.expr() {
161                    flatten_expression_into(working_set, expr, output);
162                }
163            }
164        }
165    }
166}
167
168fn flatten_positional_arg_into(
169    working_set: &StateWorkingSet,
170    positional: &Expression,
171    shape: &SyntaxShape,
172    output: &mut Vec<(Span, FlatShape)>,
173) {
174    if matches!(shape, SyntaxShape::ExternalArgument)
175        && matches!(positional.expr, Expr::String(..) | Expr::GlobPattern(..))
176    {
177        // Make known external arguments look more like external arguments
178        output.push((positional.span, FlatShape::ExternalArg));
179    } else {
180        flatten_expression_into(working_set, positional, output)
181    }
182}
183
184fn flatten_expression_into(
185    working_set: &StateWorkingSet,
186    expr: &Expression,
187    output: &mut Vec<(Span, FlatShape)>,
188) {
189    match &expr.expr {
190        Expr::AttributeBlock(ab) => {
191            for attr in &ab.attributes {
192                flatten_expression_into(working_set, &attr.expr, output);
193            }
194            flatten_expression_into(working_set, &ab.item, output);
195        }
196        Expr::BinaryOp(lhs, op, rhs) => {
197            flatten_expression_into(working_set, lhs, output);
198            flatten_expression_into(working_set, op, output);
199            flatten_expression_into(working_set, rhs, output);
200        }
201        Expr::UnaryNot(not) => {
202            output.push((
203                Span::new(expr.span.start, expr.span.start + 3),
204                FlatShape::Operator,
205            ));
206            flatten_expression_into(working_set, not, output);
207        }
208        Expr::Collect(_, expr) => {
209            flatten_expression_into(working_set, expr, output);
210        }
211        Expr::Closure(block_id) => {
212            let outer_span = expr.span;
213
214            let block = working_set.get_block(*block_id);
215            let flattened = flatten_block(working_set, block);
216
217            if let Some(first) = flattened.first()
218                && first.0.start > outer_span.start
219            {
220                output.push((
221                    Span::new(outer_span.start, first.0.start),
222                    FlatShape::Closure,
223                ));
224            }
225
226            let last = if let Some(last) = flattened.last() {
227                if last.0.end < outer_span.end {
228                    Some((Span::new(last.0.end, outer_span.end), FlatShape::Closure))
229                } else {
230                    None
231                }
232            } else {
233                // for empty closures
234                Some((outer_span, FlatShape::Closure))
235            };
236
237            output.extend(flattened);
238            if let Some(last) = last {
239                output.push(last);
240            }
241        }
242        Expr::Block(block_id) | Expr::RowCondition(block_id) | Expr::Subexpression(block_id) => {
243            let outer_span = expr.span;
244
245            let flattened = flatten_block(working_set, working_set.get_block(*block_id));
246
247            if let Some(first) = flattened.first()
248                && first.0.start > outer_span.start
249            {
250                output.push((Span::new(outer_span.start, first.0.start), FlatShape::Block));
251            }
252
253            let last = if let Some(last) = flattened.last() {
254                if last.0.end < outer_span.end {
255                    Some((Span::new(last.0.end, outer_span.end), FlatShape::Block))
256                } else {
257                    None
258                }
259            } else {
260                None
261            };
262
263            output.extend(flattened);
264            if let Some(last) = last {
265                output.push(last);
266            }
267        }
268        Expr::Call(call) => {
269            let decl = working_set.get_decl(call.decl_id);
270
271            if call.head.end != 0 {
272                // Make sure we don't push synthetic calls
273                output.push((call.head, FlatShape::InternalCall(call.decl_id)));
274            }
275
276            // Follow positional arguments from the signature.
277            let signature = decl.signature();
278            let mut positional_args = signature
279                .required_positional
280                .iter()
281                .chain(&signature.optional_positional);
282
283            let arg_start = output.len();
284            for arg in &call.arguments {
285                match arg {
286                    Argument::Positional(positional) => {
287                        let positional_arg = positional_args.next();
288                        let shape = positional_arg
289                            .or(signature.rest_positional.as_ref())
290                            .map(|arg| &arg.shape)
291                            .unwrap_or(&SyntaxShape::Any);
292
293                        flatten_positional_arg_into(working_set, positional, shape, output)
294                    }
295                    Argument::Unknown(positional) => {
296                        let shape = signature
297                            .rest_positional
298                            .as_ref()
299                            .map(|arg| &arg.shape)
300                            .unwrap_or(&SyntaxShape::Any);
301
302                        flatten_positional_arg_into(working_set, positional, shape, output)
303                    }
304                    Argument::Named(named) => {
305                        if named.0.span.end != 0 {
306                            // Ignore synthetic flags
307                            output.push((named.0.span, FlatShape::Flag));
308                        }
309                        if let Some(expr) = &named.2 {
310                            flatten_expression_into(working_set, expr, output);
311                        }
312                    }
313                    Argument::Spread(expr) => {
314                        output.push((
315                            Span::new(expr.span.start - 3, expr.span.start),
316                            FlatShape::Operator,
317                        ));
318                        flatten_expression_into(working_set, expr, output);
319                    }
320                }
321            }
322            // sort these since flags and positional args can be intermixed
323            output[arg_start..].sort();
324        }
325        Expr::ExternalCall(head, args) => {
326            if let Expr::String(..) | Expr::GlobPattern(..) = &head.expr {
327                output.push((
328                    head.span,
329                    // If this external call is through an alias, then head.span contains the
330                    // name of the alias (needed to highlight the right thing), but we also need
331                    // the name of the aliased command (to decide *how* to highlight the call).
332                    // The parser actually created this head by cloning from the alias's definition
333                    // and then just overwriting the `span` field - but `span_id` still points to
334                    // the original span, so we can recover it from there.
335                    FlatShape::External(Box::new(working_set.get_span(head.span_id))),
336                ));
337            } else {
338                flatten_expression_into(working_set, head, output);
339            }
340
341            for arg in args.as_ref() {
342                match arg {
343                    ExternalArgument::Regular(expr) => {
344                        if let Expr::String(..) | Expr::GlobPattern(..) = &expr.expr {
345                            output.push((expr.span, FlatShape::ExternalArg));
346                        } else {
347                            flatten_expression_into(working_set, expr, output);
348                        }
349                    }
350                    ExternalArgument::Spread(expr) => {
351                        output.push((
352                            Span::new(expr.span.start - 3, expr.span.start),
353                            FlatShape::Operator,
354                        ));
355                        flatten_expression_into(working_set, expr, output);
356                    }
357                }
358            }
359        }
360        Expr::Garbage => output.push((expr.span, FlatShape::Garbage)),
361        Expr::Nothing => output.push((expr.span, FlatShape::Nothing)),
362        Expr::DateTime(_) => output.push((expr.span, FlatShape::DateTime)),
363        Expr::Binary(_) => output.push((expr.span, FlatShape::Binary)),
364        Expr::Int(_) => output.push((expr.span, FlatShape::Int)),
365        Expr::Float(_) => output.push((expr.span, FlatShape::Float)),
366        Expr::MatchBlock(matches) => {
367            for (pattern, expr) in matches {
368                flatten_pattern_into(pattern, output);
369                flatten_expression_into(working_set, expr, output);
370            }
371        }
372        Expr::ValueWithUnit(value) => {
373            flatten_expression_into(working_set, &value.expr, output);
374            output.push((value.unit.span, FlatShape::String));
375        }
376        Expr::CellPath(cell_path) => {
377            output.extend(cell_path.members.iter().map(|member| match *member {
378                PathMember::String { span, .. } => (span, FlatShape::String),
379                PathMember::Int { span, .. } => (span, FlatShape::Int),
380            }));
381        }
382        Expr::FullCellPath(cell_path) => {
383            flatten_expression_into(working_set, &cell_path.head, output);
384            output.extend(cell_path.tail.iter().map(|member| match *member {
385                PathMember::String { span, .. } => (span, FlatShape::String),
386                PathMember::Int { span, .. } => (span, FlatShape::Int),
387            }));
388        }
389        Expr::ImportPattern(import_pattern) => {
390            output.push((import_pattern.head.span, FlatShape::String));
391
392            for member in &import_pattern.members {
393                match member {
394                    ImportPatternMember::Glob { span } => output.push((*span, FlatShape::String)),
395                    ImportPatternMember::Name { span, .. } => {
396                        output.push((*span, FlatShape::String))
397                    }
398                    ImportPatternMember::List { names } => {
399                        output.extend(names.iter().map(|&(_, span)| (span, FlatShape::String)))
400                    }
401                }
402            }
403        }
404        Expr::Overlay(_) => output.push((expr.span, FlatShape::String)),
405        Expr::Range(range) => {
406            if let Some(f) = &range.from {
407                flatten_expression_into(working_set, f, output);
408            }
409            if let Some(s) = &range.next {
410                output.push((range.operator.next_op_span, FlatShape::Operator));
411                flatten_expression_into(working_set, s, output);
412            }
413            output.push((range.operator.span, FlatShape::Operator));
414            if let Some(t) = &range.to {
415                flatten_expression_into(working_set, t, output);
416            }
417        }
418        Expr::Bool(_) => output.push((expr.span, FlatShape::Bool)),
419        Expr::Filepath(_, _) => output.push((expr.span, FlatShape::Filepath)),
420        Expr::Directory(_, _) => output.push((expr.span, FlatShape::Directory)),
421        Expr::GlobPattern(_, _) => output.push((expr.span, FlatShape::GlobPattern)),
422        Expr::List(list) => {
423            let outer_span = expr.span;
424            let mut last_end = outer_span.start;
425
426            for item in list {
427                match item {
428                    ListItem::Item(expr) => {
429                        let flattened = flatten_expression(working_set, expr);
430
431                        if let Some(first) = flattened.first()
432                            && first.0.start > last_end
433                        {
434                            output.push((Span::new(last_end, first.0.start), FlatShape::List));
435                        }
436
437                        if let Some(last) = flattened.last() {
438                            last_end = last.0.end;
439                        }
440
441                        output.extend(flattened);
442                    }
443                    ListItem::Spread(op_span, expr) => {
444                        if op_span.start > last_end {
445                            output.push((Span::new(last_end, op_span.start), FlatShape::List));
446                        }
447                        output.push((*op_span, FlatShape::Operator));
448                        last_end = op_span.end;
449
450                        let flattened_inner = flatten_expression(working_set, expr);
451                        if let Some(first) = flattened_inner.first()
452                            && first.0.start > last_end
453                        {
454                            output.push((Span::new(last_end, first.0.start), FlatShape::List));
455                        }
456                        if let Some(last) = flattened_inner.last() {
457                            last_end = last.0.end;
458                        }
459                        output.extend(flattened_inner);
460                    }
461                }
462            }
463
464            if last_end < outer_span.end {
465                output.push((Span::new(last_end, outer_span.end), FlatShape::List));
466            }
467        }
468        Expr::StringInterpolation(exprs) => {
469            let mut flattened = vec![];
470            for expr in exprs {
471                flatten_expression_into(working_set, expr, &mut flattened);
472            }
473
474            if let Some(first) = flattened.first()
475                && first.0.start != expr.span.start
476            {
477                // If we aren't a bare word interpolation, also highlight the outer quotes
478                output.push((
479                    Span::new(expr.span.start, expr.span.start + 2),
480                    FlatShape::StringInterpolation,
481                ));
482                flattened.push((
483                    Span::new(expr.span.end - 1, expr.span.end),
484                    FlatShape::StringInterpolation,
485                ));
486            }
487            output.extend(flattened);
488        }
489        Expr::GlobInterpolation(exprs, quoted) => {
490            let mut flattened = vec![];
491            for expr in exprs {
492                flatten_expression_into(working_set, expr, &mut flattened);
493            }
494
495            if *quoted {
496                // If we aren't a bare word interpolation, also highlight the outer quotes
497                output.push((
498                    Span::new(expr.span.start, expr.span.start + 2),
499                    FlatShape::GlobInterpolation,
500                ));
501                flattened.push((
502                    Span::new(expr.span.end - 1, expr.span.end),
503                    FlatShape::GlobInterpolation,
504                ));
505            }
506            output.extend(flattened);
507        }
508        Expr::Record(list) => {
509            let outer_span = expr.span;
510            let mut last_end = outer_span.start;
511
512            for l in list {
513                match l {
514                    RecordItem::Pair(key, val) => {
515                        let flattened_lhs = flatten_expression(working_set, key);
516                        let flattened_rhs = flatten_expression(working_set, val);
517
518                        if let Some(first) = flattened_lhs.first()
519                            && first.0.start > last_end
520                        {
521                            output.push((Span::new(last_end, first.0.start), FlatShape::Record));
522                        }
523                        if let Some(last) = flattened_lhs.last() {
524                            last_end = last.0.end;
525                        }
526                        output.extend(flattened_lhs);
527
528                        if let Some(first) = flattened_rhs.first()
529                            && first.0.start > last_end
530                        {
531                            output.push((Span::new(last_end, first.0.start), FlatShape::Record));
532                        }
533                        if let Some(last) = flattened_rhs.last() {
534                            last_end = last.0.end;
535                        }
536
537                        output.extend(flattened_rhs);
538                    }
539                    RecordItem::Spread(op_span, record) => {
540                        if op_span.start > last_end {
541                            output.push((Span::new(last_end, op_span.start), FlatShape::Record));
542                        }
543                        output.push((*op_span, FlatShape::Operator));
544                        last_end = op_span.end;
545
546                        let flattened = flatten_expression(working_set, record);
547                        if let Some(first) = flattened.first()
548                            && first.0.start > last_end
549                        {
550                            output.push((Span::new(last_end, first.0.start), FlatShape::Record));
551                        }
552                        if let Some(last) = flattened.last() {
553                            last_end = last.0.end;
554                        }
555                        output.extend(flattened);
556                    }
557                }
558            }
559            if last_end < outer_span.end {
560                output.push((Span::new(last_end, outer_span.end), FlatShape::Record));
561            }
562        }
563        Expr::Keyword(kw) => {
564            output.push((kw.span, FlatShape::Keyword));
565            flatten_expression_into(working_set, &kw.expr, output);
566        }
567        Expr::Operator(_) => output.push((expr.span, FlatShape::Operator)),
568        Expr::Signature(_) => output.push((expr.span, FlatShape::Signature)),
569        Expr::String(_) => output.push((expr.span, FlatShape::String)),
570        Expr::RawString(_) => output.push((expr.span, FlatShape::RawString)),
571        Expr::Table(table) => {
572            let outer_span = expr.span;
573            let mut last_end = outer_span.start;
574
575            for col in table.columns.as_ref() {
576                let flattened = flatten_expression(working_set, col);
577                if let Some(first) = flattened.first()
578                    && first.0.start > last_end
579                {
580                    output.push((Span::new(last_end, first.0.start), FlatShape::Table));
581                }
582
583                if let Some(last) = flattened.last() {
584                    last_end = last.0.end;
585                }
586
587                output.extend(flattened);
588            }
589            for row in table.rows.as_ref() {
590                for expr in row.as_ref() {
591                    let flattened = flatten_expression(working_set, expr);
592                    if let Some(first) = flattened.first()
593                        && first.0.start > last_end
594                    {
595                        output.push((Span::new(last_end, first.0.start), FlatShape::Table));
596                    }
597
598                    if let Some(last) = flattened.last() {
599                        last_end = last.0.end;
600                    }
601
602                    output.extend(flattened);
603                }
604            }
605
606            if last_end < outer_span.end {
607                output.push((Span::new(last_end, outer_span.end), FlatShape::Table));
608            }
609        }
610        Expr::Var(var_id) => output.push((expr.span, FlatShape::Variable(*var_id))),
611        Expr::VarDecl(var_id) => output.push((expr.span, FlatShape::VarDecl(*var_id))),
612    }
613}
614
615fn flatten_pattern_into(match_pattern: &MatchPattern, output: &mut Vec<(Span, FlatShape)>) {
616    match &match_pattern.pattern {
617        Pattern::Garbage => output.push((match_pattern.span, FlatShape::Garbage)),
618        Pattern::IgnoreValue => output.push((match_pattern.span, FlatShape::Nothing)),
619        Pattern::IgnoreRest => output.push((match_pattern.span, FlatShape::Nothing)),
620        Pattern::List(items) => {
621            if let Some(first) = items.first() {
622                if let Some(last) = items.last() {
623                    output.push((
624                        Span::new(match_pattern.span.start, first.span.start),
625                        FlatShape::MatchPattern,
626                    ));
627                    for item in items {
628                        flatten_pattern_into(item, output);
629                    }
630                    output.push((
631                        Span::new(last.span.end, match_pattern.span.end),
632                        FlatShape::MatchPattern,
633                    ))
634                }
635            } else {
636                output.push((match_pattern.span, FlatShape::MatchPattern));
637            }
638        }
639        Pattern::Record(items) => {
640            if let Some(first) = items.first() {
641                if let Some(last) = items.last() {
642                    output.push((
643                        Span::new(match_pattern.span.start, first.1.span.start),
644                        FlatShape::MatchPattern,
645                    ));
646                    for (_, pattern) in items {
647                        flatten_pattern_into(pattern, output);
648                    }
649                    output.push((
650                        Span::new(last.1.span.end, match_pattern.span.end),
651                        FlatShape::MatchPattern,
652                    ))
653                }
654            } else {
655                output.push((match_pattern.span, FlatShape::MatchPattern));
656            }
657        }
658        Pattern::Expression(_) | Pattern::Value(_) => {
659            output.push((match_pattern.span, FlatShape::MatchPattern))
660        }
661        Pattern::Variable(var_id) => output.push((match_pattern.span, FlatShape::VarDecl(*var_id))),
662        Pattern::Rest(var_id) => output.push((match_pattern.span, FlatShape::VarDecl(*var_id))),
663        Pattern::Or(patterns) => {
664            for pattern in patterns {
665                flatten_pattern_into(pattern, output);
666            }
667        }
668    }
669}
670
671pub fn flatten_block(working_set: &StateWorkingSet, block: &Block) -> Vec<(Span, FlatShape)> {
672    let mut output = Vec::new();
673    flatten_block_into(working_set, block, &mut output);
674    output
675}
676
677pub fn flatten_pipeline(
678    working_set: &StateWorkingSet,
679    pipeline: &Pipeline,
680) -> Vec<(Span, FlatShape)> {
681    let mut output = Vec::new();
682    flatten_pipeline_into(working_set, pipeline, &mut output);
683    output
684}
685
686pub fn flatten_pipeline_element(
687    working_set: &StateWorkingSet,
688    pipeline_element: &PipelineElement,
689) -> Vec<(Span, FlatShape)> {
690    let mut output = Vec::new();
691    flatten_pipeline_element_into(working_set, pipeline_element, &mut output);
692    output
693}
694
695pub fn flatten_expression(
696    working_set: &StateWorkingSet,
697    expr: &Expression,
698) -> Vec<(Span, FlatShape)> {
699    let mut output = Vec::new();
700    flatten_expression_into(working_set, expr, &mut output);
701    output
702}