use crate::ast::{
Arg, Assignment, BinaryOp, CaseBranch, CaseStmt, Command, Expr, FileTestOp, ForLoop, IfStmt,
Pipeline, Program, Redirect, RedirectKind, SpannedPart, Stmt, StringPart, StringTestOp,
TestCmpOp, TestExpr, ToolDef, Value, VarPath, VarSegment, WhileLoop,
};
use crate::lexer::{self, HereDocData, Token};
use chumsky::{input::ValueInput, prelude::*};
pub type Span = SimpleSpan;
fn parse_var_expr(raw: &str) -> Expr {
if raw == "${?}" {
return Expr::LastExitCode;
}
if raw == "${$}" {
return Expr::CurrentPid;
}
if let Some(colon_idx) = find_default_separator(raw) {
let name = raw[2..colon_idx].to_string();
let default_str = &raw[colon_idx + 2..raw.len() - 1];
let default = parse_interpolated_string(&unquote_default_word(default_str));
return Expr::VarWithDefault { name, default };
}
Expr::VarRef(parse_varpath(raw))
}
fn unquote_default_word(word: &str) -> String {
let mut out = String::with_capacity(word.len());
let mut in_single = false;
let mut in_double = false;
for ch in word.chars() {
match ch {
'\'' if !in_double => in_single = !in_single,
'"' if !in_single => in_double = !in_double,
'$' if in_single => out.push_str("__KAISH_ESCAPED_DOLLAR__"),
_ => out.push(ch),
}
}
out
}
fn find_default_separator(raw: &str) -> Option<usize> {
let bytes = raw.as_bytes();
let mut depth = 0;
let mut i = 0;
while i < bytes.len() {
if i + 1 < bytes.len() && bytes[i] == b'$' && bytes[i + 1] == b'{' {
depth += 1;
i += 2;
continue;
}
if bytes[i] == b'}' && depth > 0 {
depth -= 1;
i += 1;
continue;
}
if depth == 1 && i + 1 < bytes.len() && bytes[i] == b':' && bytes[i + 1] == b'-' {
return Some(i);
}
i += 1;
}
None
}
fn find_default_separator_in_content(content: &str) -> Option<usize> {
let bytes = content.as_bytes();
let mut depth = 0;
let mut i = 0;
while i < bytes.len() {
if i + 1 < bytes.len() && bytes[i] == b'$' && bytes[i + 1] == b'{' {
depth += 1;
i += 2;
continue;
}
if bytes[i] == b'}' && depth > 0 {
depth -= 1;
i += 1;
continue;
}
if depth == 0 && i + 1 < bytes.len() && bytes[i] == b':' && bytes[i + 1] == b'-' {
return Some(i);
}
i += 1;
}
None
}
fn parse_varpath(raw: &str) -> VarPath {
let segments_strs = lexer::parse_var_ref(raw).unwrap_or_default();
let segments = segments_strs
.into_iter()
.filter(|s| !s.starts_with('[')) .map(VarSegment::Field)
.collect();
VarPath { segments }
}
fn stmt_to_pipeline(stmt: Stmt) -> Option<Pipeline> {
match stmt {
Stmt::Pipeline(p) => Some(p),
Stmt::Command(cmd) => Some(Pipeline {
commands: vec![cmd],
background: false,
}),
_ => None,
}
}
fn parse_interpolated_string_spanned(s: &str, base_offset: usize) -> Vec<SpannedPart> {
let s = s.replace("__KAISH_ESCAPED_DOLLAR__", "\x00DOLLAR\x00");
let chars_vec: Vec<char> = s.chars().collect();
let mut i = 0;
let mut pos: usize = 0;
let mut parts: Vec<SpannedPart> = Vec::new();
let mut current_text = String::new();
let mut current_text_start: usize = pos;
let push_literal =
|current_text: &mut String, start: &mut usize, end: usize, parts: &mut Vec<SpannedPart>| {
if !current_text.is_empty() {
parts.push(SpannedPart {
part: StringPart::Literal(std::mem::take(current_text)),
offset: base_offset + *start,
len: end - *start,
});
*start = end;
}
};
while i < chars_vec.len() {
let ch = chars_vec[i];
if ch == '\x00' {
let start = pos;
i += 1;
pos += 1;
let mut marker = String::new();
while let Some(&c) = chars_vec.get(i) {
if c == '\x00' {
i += 1;
pos += 1;
break;
}
marker.push(c);
i += 1;
pos += c.len_utf8();
}
if marker == "DOLLAR" {
if current_text.is_empty() {
current_text_start = start;
}
current_text.push('$');
}
} else if ch == '\\' {
let next = chars_vec.get(i + 1).copied();
match next {
Some('$') => {
if current_text.is_empty() {
current_text_start = pos;
}
current_text.push('$');
i += 2;
pos += 2;
}
Some('\\') => {
if current_text.is_empty() {
current_text_start = pos;
}
current_text.push('\\');
i += 2;
pos += 2;
}
Some('\n') => {
i += 2;
pos += 2;
if current_text.is_empty() {
current_text_start = pos;
}
}
Some('\r') => {
i += 2;
pos += 2;
if chars_vec.get(i) == Some(&'\n') {
i += 1;
pos += 1;
}
if current_text.is_empty() {
current_text_start = pos;
}
}
_ => {
if current_text.is_empty() {
current_text_start = pos;
}
current_text.push('\\');
i += 1;
pos += 1;
}
}
} else if ch == '$' {
let part_start = pos;
let next = chars_vec.get(i + 1).copied();
if next == Some('(') && chars_vec.get(i + 2) != Some(&'(') {
push_literal(&mut current_text, &mut current_text_start, pos, &mut parts);
i += 2; pos += 2;
let mut cmd_content = String::new();
let mut depth = 1;
while let Some(&c) = chars_vec.get(i) {
i += 1;
pos += c.len_utf8();
if c == '(' {
depth += 1;
cmd_content.push(c);
} else if c == ')' {
depth -= 1;
if depth == 0 {
break;
}
cmd_content.push(c);
} else {
cmd_content.push(c);
}
}
let inserted = if let Ok(program) = parse(&cmd_content) {
if let Some(stmt) = program.statements.first() {
if let Some(pipeline) = stmt_to_pipeline(stmt.clone()) {
parts.push(SpannedPart {
part: StringPart::CommandSubst(pipeline),
offset: base_offset + part_start,
len: pos - part_start,
});
true
} else {
false
}
} else {
false
}
} else {
false
};
if inserted {
current_text_start = pos;
} else {
if current_text.is_empty() {
current_text_start = part_start;
}
current_text.push_str("$(");
current_text.push_str(&cmd_content);
current_text.push(')');
}
} else if next == Some('{') {
push_literal(&mut current_text, &mut current_text_start, pos, &mut parts);
i += 2; pos += 2;
let mut var_content = String::new();
let mut depth = 1;
while let Some(&c) = chars_vec.get(i) {
i += 1;
pos += c.len_utf8();
if c == '{' && var_content.ends_with('$') {
depth += 1;
var_content.push(c);
} else if c == '}' {
depth -= 1;
if depth == 0 {
break;
}
var_content.push(c);
} else {
var_content.push(c);
}
}
let part = if let Some(name) = var_content.strip_prefix('#') {
StringPart::VarLength(name.to_string())
} else if var_content.starts_with("__ARITH:") && var_content.ends_with("__") {
let expr = var_content
.strip_prefix("__ARITH:")
.and_then(|s| s.strip_suffix("__"))
.unwrap_or("");
StringPart::Arithmetic(expr.to_string())
} else if let Some(colon_idx) = find_default_separator_in_content(&var_content) {
let name = var_content[..colon_idx].to_string();
let default_str = &var_content[colon_idx + 2..];
let default = parse_interpolated_string(&unquote_default_word(default_str));
StringPart::VarWithDefault { name, default }
} else {
StringPart::Var(parse_varpath(&format!("${{{}}}", var_content)))
};
parts.push(SpannedPart {
part,
offset: base_offset + part_start,
len: pos - part_start,
});
current_text_start = pos;
} else if next.map(|c| c.is_ascii_digit()).unwrap_or(false) {
push_literal(&mut current_text, &mut current_text_start, pos, &mut parts);
i += 1; pos += 1;
if let Some(&digit) = chars_vec.get(i) {
let n = digit.to_digit(10).unwrap_or(0) as usize;
i += 1;
pos += digit.len_utf8();
parts.push(SpannedPart {
part: StringPart::Positional(n),
offset: base_offset + part_start,
len: pos - part_start,
});
}
current_text_start = pos;
} else if next == Some('@') {
push_literal(&mut current_text, &mut current_text_start, pos, &mut parts);
i += 2; pos += 2;
parts.push(SpannedPart {
part: StringPart::AllArgs,
offset: base_offset + part_start,
len: pos - part_start,
});
current_text_start = pos;
} else if next == Some('#') {
push_literal(&mut current_text, &mut current_text_start, pos, &mut parts);
i += 2; pos += 2;
parts.push(SpannedPart {
part: StringPart::ArgCount,
offset: base_offset + part_start,
len: pos - part_start,
});
current_text_start = pos;
} else if next == Some('?') {
push_literal(&mut current_text, &mut current_text_start, pos, &mut parts);
i += 2; pos += 2;
parts.push(SpannedPart {
part: StringPart::LastExitCode,
offset: base_offset + part_start,
len: pos - part_start,
});
current_text_start = pos;
} else if next == Some('$') {
push_literal(&mut current_text, &mut current_text_start, pos, &mut parts);
i += 2; pos += 2;
parts.push(SpannedPart {
part: StringPart::CurrentPid,
offset: base_offset + part_start,
len: pos - part_start,
});
current_text_start = pos;
} else if next.map(|c| c.is_ascii_alphabetic() || c == '_').unwrap_or(false) {
push_literal(&mut current_text, &mut current_text_start, pos, &mut parts);
i += 1; pos += 1;
let mut var_name = String::new();
while let Some(&c) = chars_vec.get(i) {
if c.is_ascii_alphanumeric() || c == '_' {
var_name.push(c);
i += 1;
pos += c.len_utf8();
} else {
break;
}
}
parts.push(SpannedPart {
part: StringPart::Var(VarPath::simple(var_name)),
offset: base_offset + part_start,
len: pos - part_start,
});
current_text_start = pos;
} else {
if current_text.is_empty() {
current_text_start = pos;
}
current_text.push(ch);
i += 1;
pos += 1;
}
} else {
if current_text.is_empty() {
current_text_start = pos;
}
current_text.push(ch);
i += 1;
pos += ch.len_utf8();
}
}
push_literal(&mut current_text, &mut current_text_start, pos, &mut parts);
parts
}
fn parse_interpolated_string(s: &str) -> Vec<StringPart> {
let s = s.replace("__KAISH_ESCAPED_DOLLAR__", "\x00DOLLAR\x00");
let mut parts = Vec::new();
let mut current_text = String::new();
let mut chars = s.chars().peekable();
while let Some(ch) = chars.next() {
if ch == '\x00' {
let mut marker = String::new();
while let Some(&c) = chars.peek() {
if c == '\x00' {
chars.next(); break;
}
if let Some(c) = chars.next() {
marker.push(c);
}
}
if marker == "DOLLAR" {
current_text.push('$');
}
} else if ch == '$' {
if chars.peek() == Some(&'(') {
if !current_text.is_empty() {
parts.push(StringPart::Literal(std::mem::take(&mut current_text)));
}
chars.next();
let mut cmd_content = String::new();
let mut paren_depth = 1;
for c in chars.by_ref() {
if c == '(' {
paren_depth += 1;
cmd_content.push(c);
} else if c == ')' {
paren_depth -= 1;
if paren_depth == 0 {
break;
}
cmd_content.push(c);
} else {
cmd_content.push(c);
}
}
if let Ok(program) = parse(&cmd_content) {
if let Some(stmt) = program.statements.first() {
if let Some(pipeline) = stmt_to_pipeline(stmt.clone()) {
parts.push(StringPart::CommandSubst(pipeline));
} else {
current_text.push_str("$(");
current_text.push_str(&cmd_content);
current_text.push(')');
}
}
} else {
current_text.push_str("$(");
current_text.push_str(&cmd_content);
current_text.push(')');
}
} else if chars.peek() == Some(&'{') {
if !current_text.is_empty() {
parts.push(StringPart::Literal(std::mem::take(&mut current_text)));
}
chars.next();
let mut var_content = String::new();
let mut depth = 1;
for c in chars.by_ref() {
if c == '{' && var_content.ends_with('$') {
depth += 1;
var_content.push(c);
} else if c == '}' {
depth -= 1;
if depth == 0 {
break;
}
var_content.push(c);
} else {
var_content.push(c);
}
}
let part = if let Some(name) = var_content.strip_prefix('#') {
StringPart::VarLength(name.to_string())
} else if var_content.starts_with("__ARITH:") && var_content.ends_with("__") {
let expr = var_content
.strip_prefix("__ARITH:")
.and_then(|s| s.strip_suffix("__"))
.unwrap_or("");
StringPart::Arithmetic(expr.to_string())
} else if let Some(colon_idx) = find_default_separator_in_content(&var_content) {
let name = var_content[..colon_idx].to_string();
let default_str = &var_content[colon_idx + 2..];
let default = parse_interpolated_string(&unquote_default_word(default_str));
StringPart::VarWithDefault { name, default }
} else {
StringPart::Var(parse_varpath(&format!("${{{}}}", var_content)))
};
parts.push(part);
} else if chars.peek().map(|c| c.is_ascii_digit()).unwrap_or(false) {
if !current_text.is_empty() {
parts.push(StringPart::Literal(std::mem::take(&mut current_text)));
}
if let Some(digit) = chars.next() {
let n = digit.to_digit(10).unwrap_or(0) as usize;
parts.push(StringPart::Positional(n));
}
} else if chars.peek() == Some(&'@') {
if !current_text.is_empty() {
parts.push(StringPart::Literal(std::mem::take(&mut current_text)));
}
chars.next(); parts.push(StringPart::AllArgs);
} else if chars.peek() == Some(&'#') {
if !current_text.is_empty() {
parts.push(StringPart::Literal(std::mem::take(&mut current_text)));
}
chars.next(); parts.push(StringPart::ArgCount);
} else if chars.peek() == Some(&'?') {
if !current_text.is_empty() {
parts.push(StringPart::Literal(std::mem::take(&mut current_text)));
}
chars.next(); parts.push(StringPart::LastExitCode);
} else if chars.peek() == Some(&'$') {
if !current_text.is_empty() {
parts.push(StringPart::Literal(std::mem::take(&mut current_text)));
}
chars.next(); parts.push(StringPart::CurrentPid);
} else if chars.peek().map(|c| c.is_ascii_alphabetic() || *c == '_').unwrap_or(false) {
if !current_text.is_empty() {
parts.push(StringPart::Literal(std::mem::take(&mut current_text)));
}
let mut var_name = String::new();
while let Some(&c) = chars.peek() {
if c.is_ascii_alphanumeric() || c == '_' {
if let Some(c) = chars.next() {
var_name.push(c);
}
} else {
break;
}
}
parts.push(StringPart::Var(VarPath::simple(var_name)));
} else {
current_text.push(ch);
}
} else {
current_text.push(ch);
}
}
if !current_text.is_empty() {
parts.push(StringPart::Literal(current_text));
}
parts
}
#[derive(Debug, Clone)]
pub struct ParseError {
pub span: Span,
pub message: String,
}
impl ParseError {
pub fn format(&self, source: &str) -> String {
let start = self.span.start;
let mut line = 1usize;
let mut col = 1usize;
for (i, ch) in source.char_indices() {
if i >= start {
break;
}
if ch == '\n' {
line += 1;
col = 1;
} else {
col += 1;
}
}
let line_content = {
let line_start = source[..start.min(source.len())]
.rfind('\n')
.map_or(0, |i| i + 1);
let line_end = source[start.min(source.len())..]
.find('\n')
.map_or(source.len(), |i| start + i);
source.get(line_start..line_end).unwrap_or("")
};
if line_content.is_empty() {
format!("{}:{} [parse]: {}", line, col, self.message)
} else {
format!(
"{}:{} [parse]: {}\n | {}",
line, col, self.message, line_content
)
}
}
}
impl std::fmt::Display for ParseError {
fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
write!(f, "{} at {:?}", self.message, self.span)
}
}
impl std::error::Error for ParseError {}
pub fn parse(source: &str) -> Result<Program, Vec<ParseError>> {
let tokens = lexer::tokenize(source).map_err(|errs| {
errs.into_iter()
.map(|e| ParseError {
span: (e.span.start..e.span.end).into(),
message: format!("lexer error: {}", e.token),
})
.collect::<Vec<_>>()
})?;
let tokens: Vec<(Token, Span)> = tokens
.into_iter()
.map(|spanned| (spanned.token, (spanned.span.start..spanned.span.end).into()))
.collect();
let end_span: Span = (source.len()..source.len()).into();
let parser = program_parser();
let result = parser.parse(tokens.as_slice().map(end_span, |(t, s)| (t, s)));
let program = result.into_result().map_err(|errs| {
errs.into_iter()
.map(|e| ParseError {
span: *e.span(),
message: e.to_string(),
})
.collect::<Vec<_>>()
})?;
if first_ambiguous_stdin(&program.statements) {
return Err(vec![ParseError {
span: (0..0).into(),
message: "multiple stdin redirects on one command are ambiguous; \
use exactly one of `<`, `<<`, or `<<<`"
.to_string(),
}]);
}
Ok(program)
}
pub fn parse_statement(source: &str) -> Result<Stmt, Vec<ParseError>> {
let program = parse(source)?;
program
.statements
.into_iter()
.find(|s| !matches!(s, Stmt::Empty))
.ok_or_else(|| {
vec![ParseError {
span: (0..source.len()).into(),
message: "empty input".to_string(),
}]
})
}
fn program_parser<'tokens, 'src: 'tokens, I>(
) -> impl Parser<'tokens, I, Program, extra::Err<Rich<'tokens, Token, Span>>>
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
statement_parser()
.repeated()
.collect::<Vec<_>>()
.map(|statements| Program { statements })
}
fn statement_parser<'tokens, I>(
) -> impl Parser<'tokens, I, Stmt, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
recursive(|stmt| {
let terminator = choice((just(Token::Newline), just(Token::Semi))).repeated();
let break_stmt = just(Token::Break)
.ignore_then(
select! { Token::Int(n) => n as usize }.or_not()
)
.map(Stmt::Break);
let continue_stmt = just(Token::Continue)
.ignore_then(
select! { Token::Int(n) => n as usize }.or_not()
)
.map(Stmt::Continue);
let return_stmt = just(Token::Return)
.ignore_then(primary_expr_parser().or_not())
.map(|e| Stmt::Return(e.map(Box::new)));
let exit_stmt = just(Token::Exit)
.ignore_then(primary_expr_parser().or_not())
.map(|e| Stmt::Exit(e.map(Box::new)));
let set_flag_arg = choice((
select! { Token::ShortFlag(f) => Arg::ShortFlag(f) },
select! { Token::LongFlag(f) => Arg::LongFlag(f) },
select! { Token::PlusFlag(f) => Arg::Positional(Expr::Literal(Value::String(format!("+{}", f)))) },
));
let option_value_str = select! {
Token::NumberIdent(s) => s,
Token::Int(n) => n.to_string(),
Token::Ident(s) => s,
};
let set_option_assign = ident_parser()
.then_ignore(just(Token::Eq))
.then(option_value_str)
.map(|(name, value)| {
Arg::Positional(Expr::Literal(Value::String(format!("{name}={value}"))))
});
let set_quoted_arg = select! {
Token::String(s) => Arg::Positional(Expr::Literal(Value::String(s))),
Token::SingleString(s) => Arg::Positional(Expr::Literal(Value::String(s))),
};
let set_with_flags = just(Token::Set)
.then(set_flag_arg)
.then(
choice((
set_flag_arg,
set_option_assign,
set_quoted_arg,
ident_parser().map(|name| Arg::Positional(Expr::Literal(Value::String(name)))),
))
.repeated()
.collect::<Vec<_>>(),
)
.map(|((_, first_arg), mut rest_args)| {
let mut args = vec![first_arg];
args.append(&mut rest_args);
Stmt::Command(Command {
name: "set".to_string(),
args,
redirects: vec![],
})
});
let set_no_args = just(Token::Set)
.then(
choice((
just(Token::Newline).to(()),
just(Token::Semi).to(()),
just(Token::And).to(()),
just(Token::Or).to(()),
end(),
))
.rewind(),
)
.map(|_| Stmt::Command(Command {
name: "set".to_string(),
args: vec![],
redirects: vec![],
}));
let set_command = set_with_flags.or(set_no_args);
let base_statement = choice((
just(Token::Newline).to(Stmt::Empty),
set_command,
assignment_parser().map(Stmt::Assignment),
posix_function_parser(stmt.clone()).map(Stmt::ToolDef), bash_function_parser(stmt.clone()).map(Stmt::ToolDef), if_parser(stmt.clone()).map(Stmt::If),
for_parser(stmt.clone()).map(Stmt::For),
while_parser(stmt.clone()).map(Stmt::While),
case_parser(stmt.clone()).map(Stmt::Case),
break_stmt,
continue_stmt,
return_stmt,
exit_stmt,
test_expr_stmt_parser().map(Stmt::Test),
pipeline_parser().map(|p| {
if p.commands.len() == 1 && !p.background {
if p.commands[0].redirects.is_empty() {
match p.commands.into_iter().next() {
Some(cmd) => Stmt::Command(cmd),
None => Stmt::Empty, }
} else {
Stmt::Pipeline(p)
}
} else {
Stmt::Pipeline(p)
}
}),
))
.boxed();
let and_chain = base_statement
.clone()
.foldl(
just(Token::And).ignore_then(base_statement).repeated(),
|left, right| Stmt::AndChain {
left: Box::new(left),
right: Box::new(right),
},
);
and_chain
.clone()
.foldl(
just(Token::Or).ignore_then(and_chain).repeated(),
|left, right| Stmt::OrChain {
left: Box::new(left),
right: Box::new(right),
},
)
.then_ignore(terminator)
})
}
fn assignment_parser<'tokens, I>(
) -> impl Parser<'tokens, I, Assignment, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
let local_assignment = just(Token::Local)
.ignore_then(ident_parser())
.then_ignore(just(Token::Eq))
.then(expr_parser())
.map(|(name, value)| Assignment {
name,
value,
local: true,
});
let bash_assignment = ident_parser()
.then_ignore(just(Token::Eq))
.then(expr_parser())
.map(|(name, value)| Assignment {
name,
value,
local: false,
});
choice((local_assignment, bash_assignment))
.labelled("assignment")
.boxed()
}
fn posix_function_parser<'tokens, I, S>(
stmt: S,
) -> impl Parser<'tokens, I, ToolDef, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
S: Parser<'tokens, I, Stmt, extra::Err<Rich<'tokens, Token, Span>>> + Clone + 'tokens,
{
ident_parser()
.then_ignore(just(Token::LParen))
.then_ignore(just(Token::RParen))
.then_ignore(just(Token::LBrace))
.then_ignore(just(Token::Newline).repeated())
.then(
stmt.repeated()
.collect::<Vec<_>>()
.map(|stmts| stmts.into_iter().filter(|s| !matches!(s, Stmt::Empty)).collect()),
)
.then_ignore(just(Token::Newline).repeated())
.then_ignore(just(Token::RBrace))
.map(|(name, body)| ToolDef { name, params: vec![], body })
.labelled("POSIX function")
.boxed()
}
fn bash_function_parser<'tokens, I, S>(
stmt: S,
) -> impl Parser<'tokens, I, ToolDef, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
S: Parser<'tokens, I, Stmt, extra::Err<Rich<'tokens, Token, Span>>> + Clone + 'tokens,
{
just(Token::Function)
.ignore_then(ident_parser())
.then_ignore(just(Token::LBrace))
.then_ignore(just(Token::Newline).repeated())
.then(
stmt.repeated()
.collect::<Vec<_>>()
.map(|stmts| stmts.into_iter().filter(|s| !matches!(s, Stmt::Empty)).collect()),
)
.then_ignore(just(Token::Newline).repeated())
.then_ignore(just(Token::RBrace))
.map(|(name, body)| ToolDef { name, params: vec![], body })
.labelled("bash function")
.boxed()
}
fn if_parser<'tokens, I, S>(
stmt: S,
) -> impl Parser<'tokens, I, IfStmt, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
S: Parser<'tokens, I, Stmt, extra::Err<Rich<'tokens, Token, Span>>> + Clone + 'tokens,
{
let branch = condition_parser()
.then_ignore(just(Token::Semi).or_not())
.then_ignore(just(Token::Newline).repeated())
.then_ignore(just(Token::Then))
.then_ignore(just(Token::Newline).repeated())
.then(
stmt.clone()
.repeated()
.collect::<Vec<_>>()
.map(|stmts: Vec<Stmt>| {
stmts
.into_iter()
.filter(|s| !matches!(s, Stmt::Empty))
.collect::<Vec<_>>()
}),
);
let elif_branch = just(Token::Elif)
.ignore_then(condition_parser())
.then_ignore(just(Token::Semi).or_not())
.then_ignore(just(Token::Newline).repeated())
.then_ignore(just(Token::Then))
.then_ignore(just(Token::Newline).repeated())
.then(
stmt.clone()
.repeated()
.collect::<Vec<_>>()
.map(|stmts: Vec<Stmt>| {
stmts
.into_iter()
.filter(|s| !matches!(s, Stmt::Empty))
.collect::<Vec<_>>()
}),
);
let else_branch = just(Token::Else)
.ignore_then(just(Token::Newline).repeated())
.ignore_then(stmt.repeated().collect::<Vec<_>>())
.map(|stmts: Vec<Stmt>| {
stmts
.into_iter()
.filter(|s| !matches!(s, Stmt::Empty))
.collect::<Vec<_>>()
});
just(Token::If)
.ignore_then(branch)
.then(elif_branch.repeated().collect::<Vec<_>>())
.then(else_branch.or_not())
.then_ignore(just(Token::Fi))
.map(|(((condition, then_branch), elif_branches), else_branch)| {
build_if_chain(condition, then_branch, elif_branches, else_branch)
})
.labelled("if statement")
.boxed()
}
fn build_if_chain(
condition: Expr,
then_branch: Vec<Stmt>,
mut elif_branches: Vec<(Expr, Vec<Stmt>)>,
else_branch: Option<Vec<Stmt>>,
) -> IfStmt {
if elif_branches.is_empty() {
IfStmt {
condition: Box::new(condition),
then_branch,
else_branch,
}
} else {
let (elif_cond, elif_then) = elif_branches.remove(0);
let nested_if = build_if_chain(elif_cond, elif_then, elif_branches, else_branch);
IfStmt {
condition: Box::new(condition),
then_branch,
else_branch: Some(vec![Stmt::If(nested_if)]),
}
}
}
fn for_parser<'tokens, I, S>(
stmt: S,
) -> impl Parser<'tokens, I, ForLoop, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
S: Parser<'tokens, I, Stmt, extra::Err<Rich<'tokens, Token, Span>>> + Clone + 'tokens,
{
just(Token::For)
.ignore_then(ident_parser())
.then_ignore(just(Token::In))
.then(expr_parser().repeated().at_least(1).collect::<Vec<_>>())
.then_ignore(just(Token::Semi).or_not())
.then_ignore(just(Token::Newline).repeated())
.then_ignore(just(Token::Do))
.then_ignore(just(Token::Newline).repeated())
.then(
stmt.repeated()
.collect::<Vec<_>>()
.map(|stmts| stmts.into_iter().filter(|s| !matches!(s, Stmt::Empty)).collect()),
)
.then_ignore(just(Token::Done))
.map(|((variable, items), body)| ForLoop {
variable,
items,
body,
})
.labelled("for loop")
.boxed()
}
fn while_parser<'tokens, I, S>(
stmt: S,
) -> impl Parser<'tokens, I, WhileLoop, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
S: Parser<'tokens, I, Stmt, extra::Err<Rich<'tokens, Token, Span>>> + Clone + 'tokens,
{
just(Token::While)
.ignore_then(condition_parser())
.then_ignore(just(Token::Semi).or_not())
.then_ignore(just(Token::Newline).repeated())
.then_ignore(just(Token::Do))
.then_ignore(just(Token::Newline).repeated())
.then(
stmt.repeated()
.collect::<Vec<_>>()
.map(|stmts| stmts.into_iter().filter(|s| !matches!(s, Stmt::Empty)).collect()),
)
.then_ignore(just(Token::Done))
.map(|(condition, body)| WhileLoop {
condition: Box::new(condition),
body,
})
.labelled("while loop")
.boxed()
}
fn case_parser<'tokens, I, S>(
stmt: S,
) -> impl Parser<'tokens, I, CaseStmt, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
S: Parser<'tokens, I, Stmt, extra::Err<Rich<'tokens, Token, Span>>> + Clone + 'tokens,
{
let pattern_part = choice((
select! { Token::GlobWord(s) => s },
select! { Token::Ident(s) => s },
select! { Token::NumberIdent(s) => s },
select! { Token::DottedIdent(s) => s },
select! { Token::String(s) => s },
select! { Token::SingleString(s) => s },
select! { Token::Int(n) => n.to_string() },
select! { Token::Star => "*".to_string() },
select! { Token::Question => "?".to_string() },
select! { Token::Dot => ".".to_string() },
select! { Token::DotDot => "..".to_string() },
select! { Token::Tilde => "~".to_string() },
select! { Token::TildePath(s) => s },
select! { Token::RelativePath(s) => s },
select! { Token::DotSlashPath(s) => s },
select! { Token::Path(p) => p },
select! { Token::VarRef(v) => v },
select! { Token::SimpleVarRef(v) => format!("${}", v) },
just(Token::LBracket)
.ignore_then(
choice((
select! { Token::Ident(s) => s },
select! { Token::Int(n) => n.to_string() },
just(Token::Colon).to(":".to_string()),
just(Token::Bang).to("!".to_string()),
select! { Token::ShortFlag(s) => format!("-{}", s) },
))
.repeated()
.at_least(1)
.collect::<Vec<String>>()
)
.then_ignore(just(Token::RBracket))
.map(|parts| format!("[{}]", parts.join(""))),
just(Token::LBrace)
.ignore_then(
choice((
select! { Token::Ident(s) => s },
select! { Token::Int(n) => n.to_string() },
))
.separated_by(just(Token::Comma))
.at_least(1)
.collect::<Vec<String>>()
)
.then_ignore(just(Token::RBrace))
.map(|parts| format!("{{{}}}", parts.join(","))),
));
let pattern = pattern_part
.repeated()
.at_least(1)
.collect::<Vec<String>>()
.map(|parts| parts.join(""))
.labelled("case pattern");
let patterns = pattern
.separated_by(just(Token::Pipe))
.at_least(1)
.collect::<Vec<String>>()
.labelled("case patterns");
let branch = just(Token::LParen)
.or_not()
.ignore_then(just(Token::Newline).repeated())
.ignore_then(patterns)
.then_ignore(just(Token::RParen))
.then_ignore(just(Token::Newline).repeated())
.then(
stmt.clone()
.repeated()
.collect::<Vec<_>>()
.map(|stmts| stmts.into_iter().filter(|s| !matches!(s, Stmt::Empty)).collect()),
)
.then_ignore(just(Token::DoubleSemi))
.then_ignore(just(Token::Newline).repeated())
.map(|(patterns, body)| CaseBranch { patterns, body })
.labelled("case branch");
just(Token::Case)
.ignore_then(expr_parser())
.then_ignore(just(Token::In))
.then_ignore(just(Token::Newline).repeated())
.then(branch.repeated().collect::<Vec<_>>())
.then_ignore(just(Token::Esac))
.map(|(expr, branches)| CaseStmt { expr, branches })
.labelled("case statement")
.boxed()
}
fn pipeline_parser<'tokens, I>(
) -> impl Parser<'tokens, I, Pipeline, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
command_parser()
.separated_by(just(Token::Pipe))
.at_least(1)
.collect::<Vec<_>>()
.then(just(Token::Amp).or_not())
.map(|(commands, bg)| Pipeline {
commands,
background: bg.is_some(),
})
.labelled("pipeline")
.boxed()
}
fn command_parser<'tokens, I>(
) -> impl Parser<'tokens, I, Command, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
let command_name = choice((
ident_parser(),
path_parser(),
select! { Token::DotSlashPath(s) => s },
just(Token::True).to("true".to_string()),
just(Token::False).to("false".to_string()),
just(Token::Dot).to(".".to_string()),
));
command_name
.then(args_list_parser())
.then(redirect_parser().repeated().collect::<Vec<_>>())
.map(|((name, args), redirects)| Command {
name,
args,
redirects,
})
.labelled("command")
.boxed()
}
fn command_has_ambiguous_stdin(cmd: &Command) -> bool {
cmd.redirects
.iter()
.filter(|r| {
matches!(
r.kind,
RedirectKind::Stdin | RedirectKind::HereDoc | RedirectKind::HereString
)
})
.count()
> 1
}
fn first_ambiguous_stdin(stmts: &[Stmt]) -> bool {
stmts.iter().any(stmt_has_ambiguous_stdin)
}
fn stmt_has_ambiguous_stdin(stmt: &Stmt) -> bool {
match stmt {
Stmt::Command(c) => command_has_ambiguous_stdin(c),
Stmt::Pipeline(p) => p.commands.iter().any(command_has_ambiguous_stdin),
Stmt::If(i) => {
first_ambiguous_stdin(&i.then_branch)
|| i.else_branch
.as_deref()
.is_some_and(first_ambiguous_stdin)
}
Stmt::For(f) => first_ambiguous_stdin(&f.body),
Stmt::While(w) => first_ambiguous_stdin(&w.body),
Stmt::Case(c) => c.branches.iter().any(|b| first_ambiguous_stdin(&b.body)),
Stmt::ToolDef(t) => first_ambiguous_stdin(&t.body),
Stmt::AndChain { left, right } | Stmt::OrChain { left, right } => {
stmt_has_ambiguous_stdin(left) || stmt_has_ambiguous_stdin(right)
}
Stmt::Assignment(_)
| Stmt::Break(_)
| Stmt::Continue(_)
| Stmt::Return(_)
| Stmt::Exit(_)
| Stmt::Test(_)
| Stmt::Empty => false,
}
}
fn args_list_parser<'tokens, I>(
) -> impl Parser<'tokens, I, Vec<Arg>, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
let pre_dash = arg_before_double_dash_parser()
.repeated()
.collect::<Vec<_>>();
let double_dash = select! {
Token::DoubleDash => Arg::DoubleDash,
};
let post_dash_arg = choice((
select! {
Token::ShortFlag(name) => Arg::Positional(Expr::Literal(Value::String(format!("-{}", name)))),
Token::LongFlag(name) => Arg::Positional(Expr::Literal(Value::String(format!("--{}", name)))),
},
primary_expr_parser().map(Arg::Positional),
));
let post_dash = post_dash_arg.repeated().collect::<Vec<_>>();
pre_dash
.then(double_dash.then(post_dash).or_not())
.map(|(mut args, maybe_dd)| {
if let Some((dd, post)) = maybe_dd {
args.push(dd);
args.extend(post);
}
args
})
}
fn arg_before_double_dash_parser<'tokens, I>(
) -> impl Parser<'tokens, I, Arg, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
let long_flag_with_value = select! {
Token::LongFlag(name) => name,
}
.then_ignore(just(Token::Eq))
.then(primary_expr_parser())
.map(|(key, value)| Arg::Named { key, value });
let long_flag = select! {
Token::LongFlag(name) => Arg::LongFlag(name),
};
let short_flag = select! {
Token::ShortFlag(name) => Arg::ShortFlag(name),
};
let named = select! {
Token::Ident(s) => s,
}
.map_with(|s, e| -> (String, Span) { (s, e.span()) })
.then(just(Token::Eq).map_with(|_, e| -> Span { e.span() }))
.then(primary_expr_parser().map_with(|expr, e| -> (Expr, Span) { (expr, e.span()) }))
.try_map(|(((key, key_span), eq_span), (value, value_span)): (((String, Span), Span), (Expr, Span)), span| {
if key_span.end != eq_span.start || eq_span.end != value_span.start {
Err(Rich::custom(
span,
"shell assignment must not have spaces around '=' (use 'key=value' not 'key = value')",
))
} else {
Ok(Arg::WordAssign { key, value })
}
});
let positional = primary_expr_parser().map(Arg::Positional);
choice((
long_flag_with_value,
long_flag,
short_flag,
named,
positional,
))
.boxed()
}
fn redirect_parser<'tokens, I>(
) -> impl Parser<'tokens, I, Redirect, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
let regular_redirect = select! {
Token::GtGt => RedirectKind::StdoutAppend,
Token::Gt => RedirectKind::StdoutOverwrite,
Token::Lt => RedirectKind::Stdin,
Token::Stderr => RedirectKind::Stderr,
Token::Both => RedirectKind::Both,
}
.then(primary_expr_parser())
.map(|(kind, target)| Redirect { kind, target });
let heredoc_redirect = just(Token::HereDocStart)
.ignore_then(select! { Token::HereDoc(data) => data })
.map(|data: HereDocData| {
let target = if data.literal {
let body = if data.strip_tabs {
crate::interpreter::strip_leading_tabs(&data.content)
} else {
data.content
};
Expr::Literal(Value::String(body))
} else {
let parts = parse_interpolated_string_spanned(
&data.content,
data.body_start_offset,
);
if parts.len() == 1 && !data.strip_tabs {
if let StringPart::Literal(text) = &parts[0].part {
return Redirect {
kind: RedirectKind::HereDoc,
target: Expr::Literal(Value::String(text.clone())),
};
}
}
Expr::HereDocBody {
parts,
strip_tabs: data.strip_tabs,
}
};
Redirect {
kind: RedirectKind::HereDoc,
target,
}
});
let herestring_redirect = just(Token::HereString)
.ignore_then(primary_expr_parser())
.map(|target| Redirect {
kind: RedirectKind::HereString,
target,
});
let merge_stderr_redirect = just(Token::StderrToStdout)
.map(|_| Redirect {
kind: RedirectKind::MergeStderr,
target: Expr::Literal(Value::Null),
});
let merge_stdout_redirect = choice((
just(Token::StdoutToStderr),
just(Token::StdoutToStderr2),
))
.map(|_| Redirect {
kind: RedirectKind::MergeStdout,
target: Expr::Literal(Value::Null),
});
choice((
heredoc_redirect,
herestring_redirect,
merge_stderr_redirect,
merge_stdout_redirect,
regular_redirect,
))
.labelled("redirect")
.boxed()
}
fn test_expr_stmt_parser<'tokens, I>(
) -> impl Parser<'tokens, I, TestExpr, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
let file_test_op = select! {
Token::ShortFlag(s) if s == "e" => FileTestOp::Exists,
Token::ShortFlag(s) if s == "f" => FileTestOp::IsFile,
Token::ShortFlag(s) if s == "d" => FileTestOp::IsDir,
Token::ShortFlag(s) if s == "r" => FileTestOp::Readable,
Token::ShortFlag(s) if s == "w" => FileTestOp::Writable,
Token::ShortFlag(s) if s == "x" => FileTestOp::Executable,
};
let string_test_op = select! {
Token::ShortFlag(s) if s == "z" => StringTestOp::IsEmpty,
Token::ShortFlag(s) if s == "n" => StringTestOp::IsNonEmpty,
};
let cmp_op = choice((
just(Token::EqEq).to(TestCmpOp::Eq),
just(Token::Eq).to(TestCmpOp::Eq),
just(Token::NotEq).to(TestCmpOp::NotEq),
just(Token::Match).to(TestCmpOp::Match),
just(Token::NotMatch).to(TestCmpOp::NotMatch),
just(Token::Gt).to(TestCmpOp::Gt),
just(Token::Lt).to(TestCmpOp::Lt),
just(Token::GtEq).to(TestCmpOp::GtEq),
just(Token::LtEq).to(TestCmpOp::LtEq),
select! { Token::ShortFlag(s) if s == "eq" => TestCmpOp::NumEq },
select! { Token::ShortFlag(s) if s == "ne" => TestCmpOp::NumNotEq },
select! { Token::ShortFlag(s) if s == "gt" => TestCmpOp::NumGt },
select! { Token::ShortFlag(s) if s == "lt" => TestCmpOp::NumLt },
select! { Token::ShortFlag(s) if s == "ge" => TestCmpOp::NumGtEq },
select! { Token::ShortFlag(s) if s == "le" => TestCmpOp::NumLtEq },
));
let file_test = file_test_op
.then(primary_expr_parser())
.map(|(op, path)| TestExpr::FileTest {
op,
path: Box::new(path),
});
let string_test = string_test_op
.then(primary_expr_parser())
.map(|(op, value)| TestExpr::StringTest {
op,
value: Box::new(value),
});
let comparison = primary_expr_parser()
.then(cmp_op)
.then(primary_expr_parser())
.map(|((left, op), right)| TestExpr::Comparison {
left: Box::new(left),
op,
right: Box::new(right),
});
let primary_test = choice((file_test, string_test, comparison));
let unary = recursive(|unary| {
let not_expr = just(Token::Bang)
.ignore_then(unary)
.map(|expr| TestExpr::Not { expr: Box::new(expr) });
choice((not_expr, primary_test.clone()))
});
let and_expr = unary.clone().foldl(
just(Token::And).ignore_then(unary).repeated(),
|left, right| TestExpr::And {
left: Box::new(left),
right: Box::new(right),
},
);
let compound_test = and_expr.clone().foldl(
just(Token::Or).ignore_then(and_expr).repeated(),
|left, right| TestExpr::Or {
left: Box::new(left),
right: Box::new(right),
},
);
just(Token::LBracket)
.then(just(Token::LBracket))
.ignore_then(compound_test)
.then_ignore(just(Token::RBracket).then(just(Token::RBracket)))
.labelled("test expression")
.boxed()
}
fn condition_parser<'tokens, I>(
) -> impl Parser<'tokens, I, Expr, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
let test_expr_condition = test_expr_stmt_parser().map(|test| Expr::Test(Box::new(test)));
let command_condition = command_parser().map(Expr::Command);
let base = choice((test_expr_condition, command_condition));
let and_expr = base.clone().foldl(
just(Token::And).ignore_then(base).repeated(),
|left, right| Expr::BinaryOp {
left: Box::new(left),
op: BinaryOp::And,
right: Box::new(right),
},
);
and_expr
.clone()
.foldl(
just(Token::Or).ignore_then(and_expr).repeated(),
|left, right| Expr::BinaryOp {
left: Box::new(left),
op: BinaryOp::Or,
right: Box::new(right),
},
)
.labelled("condition")
.boxed()
}
fn expr_parser<'tokens, I>(
) -> impl Parser<'tokens, I, Expr, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
primary_expr_parser()
}
fn primary_expr_parser<'tokens, I>(
) -> impl Parser<'tokens, I, Expr, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
let positional = select! {
Token::Positional(n) => Expr::Positional(n),
Token::AllArgs => Expr::AllArgs,
Token::ArgCount => Expr::ArgCount,
Token::VarLength(name) => Expr::VarLength(name),
Token::LastExitCode => Expr::LastExitCode,
Token::CurrentPid => Expr::CurrentPid,
};
let arithmetic = select! {
Token::Arithmetic(expr_str) => Expr::Arithmetic(expr_str),
};
let keyword_as_bareword = select! {
Token::Done => "done",
Token::Fi => "fi",
Token::Then => "then",
Token::Else => "else",
Token::Elif => "elif",
Token::In => "in",
Token::Do => "do",
Token::Esac => "esac",
Token::Set => "set",
}
.map(|s| Expr::Literal(Value::String(s.to_string())));
let plus_minus_bare = select! {
Token::PlusBare(s) => Expr::Literal(Value::String(s)),
Token::MinusBare(s) => Expr::Literal(Value::String(s)),
Token::MinusAlone => Expr::Literal(Value::String("-".to_string())),
};
let glob_pattern = select! {
Token::GlobWord(s) => Expr::GlobPattern(s),
Token::Star => Expr::GlobPattern("*".to_string()),
Token::Question => Expr::GlobPattern("?".to_string()),
};
recursive(|expr| {
choice((
positional,
arithmetic,
cmd_subst_parser(expr.clone()),
var_expr_parser(),
interpolated_string_parser(),
literal_parser().map(Expr::Literal),
glob_pattern,
ident_parser().map(|s| Expr::Literal(Value::String(s))),
path_parser().map(|s| Expr::Literal(Value::String(s))),
select! {
Token::Dot => Expr::Literal(Value::String(".".into())),
Token::DotDot => Expr::Literal(Value::String("..".into())),
Token::Tilde => Expr::Literal(Value::String("~".into())),
Token::TildePath(s) => Expr::Literal(Value::String(s)),
Token::RelativePath(s) => Expr::Literal(Value::String(s)),
Token::DotSlashPath(s) => Expr::Literal(Value::String(s)),
Token::NumberIdent(s) => Expr::Literal(Value::String(s)),
Token::DottedIdent(s) => Expr::Literal(Value::String(s)),
Token::JobSpec(s) => Expr::Literal(Value::String(s)),
},
plus_minus_bare,
keyword_as_bareword,
))
.labelled("expression")
})
.boxed()
}
fn var_expr_parser<'tokens, I>(
) -> impl Parser<'tokens, I, Expr, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
select! {
Token::VarRef(raw) => parse_var_expr(&raw),
Token::SimpleVarRef(name) => Expr::VarRef(VarPath::simple(name)),
}
.labelled("variable reference")
}
fn cmd_subst_parser<'tokens, I, E>(
expr: E,
) -> impl Parser<'tokens, I, Expr, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
E: Parser<'tokens, I, Expr, extra::Err<Rich<'tokens, Token, Span>>> + Clone,
{
let long_flag_with_value = select! {
Token::LongFlag(name) => name,
}
.then_ignore(just(Token::Eq))
.then(expr.clone())
.map(|(key, value)| Arg::Named { key, value });
let long_flag = select! {
Token::LongFlag(name) => Arg::LongFlag(name),
};
let short_flag = select! {
Token::ShortFlag(name) => Arg::ShortFlag(name),
};
let named = ident_parser()
.then_ignore(just(Token::Eq))
.then(expr.clone())
.map(|(key, value)| Arg::WordAssign { key, value });
let positional = expr.map(Arg::Positional);
let arg = choice((
long_flag_with_value,
long_flag,
short_flag,
named,
positional,
));
let command_name = choice((
ident_parser(),
just(Token::True).to("true".to_string()),
just(Token::False).to("false".to_string()),
));
let command = command_name
.then(arg.repeated().collect::<Vec<_>>())
.map(|(name, args)| Command {
name,
args,
redirects: vec![],
});
let pipeline = command
.separated_by(just(Token::Pipe))
.at_least(1)
.collect::<Vec<_>>()
.map(|commands| Pipeline {
commands,
background: false,
});
just(Token::CmdSubstStart)
.ignore_then(pipeline)
.then_ignore(just(Token::RParen))
.map(|pipeline| Expr::CommandSubst(Box::new(pipeline)))
.labelled("command substitution")
}
fn interpolated_string_parser<'tokens, I>(
) -> impl Parser<'tokens, I, Expr, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
let double_quoted = select! {
Token::String(s) => s,
}
.map(|s| {
if s.contains('$') || s.contains("__KAISH_ESCAPED_DOLLAR__") {
let parts = parse_interpolated_string(&s);
if parts.len() == 1
&& let StringPart::Literal(text) = &parts[0] {
return Expr::Literal(Value::String(text.clone()));
}
Expr::Interpolated(parts)
} else {
Expr::Literal(Value::String(s))
}
});
let single_quoted = select! {
Token::SingleString(s) => Expr::Literal(Value::String(s)),
};
choice((single_quoted, double_quoted)).labelled("string")
}
fn literal_parser<'tokens, I>(
) -> impl Parser<'tokens, I, Value, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
choice((
select! {
Token::True => Value::Bool(true),
Token::False => Value::Bool(false),
},
select! {
Token::Int(n) => Value::Int(n),
Token::Float(f) => Value::Float(f),
},
))
.labelled("literal")
.boxed()
}
fn ident_parser<'tokens, I>(
) -> impl Parser<'tokens, I, String, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
select! {
Token::Ident(s) => s,
}
.labelled("identifier")
}
fn path_parser<'tokens, I>(
) -> impl Parser<'tokens, I, String, extra::Err<Rich<'tokens, Token, Span>>> + Clone
where
I: ValueInput<'tokens, Token = Token, Span = Span>,
{
select! {
Token::Path(s) => s,
}
.labelled("path")
}
#[cfg(test)]
mod tests {
use super::*;
#[test]
fn parse_empty() {
let result = parse("");
assert!(result.is_ok());
assert_eq!(result.expect("ok").statements.len(), 0);
}
#[test]
fn parse_newlines_only() {
let result = parse("\n\n\n");
assert!(result.is_ok());
}
#[test]
fn parse_simple_command() {
let result = parse("echo");
assert!(result.is_ok());
let program = result.expect("ok");
assert_eq!(program.statements.len(), 1);
assert!(matches!(&program.statements[0], Stmt::Command(_)));
}
#[test]
fn parse_command_with_string_arg() {
let result = parse(r#"echo "hello""#);
assert!(result.is_ok());
let program = result.expect("ok");
match &program.statements[0] {
Stmt::Command(cmd) => assert_eq!(cmd.args.len(), 1),
_ => panic!("expected Command"),
}
}
#[test]
fn parse_assignment() {
let result = parse("X=5");
assert!(result.is_ok());
let program = result.expect("ok");
assert!(matches!(&program.statements[0], Stmt::Assignment(_)));
}
#[test]
fn parse_pipeline() {
let result = parse("a | b | c");
assert!(result.is_ok());
let program = result.expect("ok");
match &program.statements[0] {
Stmt::Pipeline(p) => assert_eq!(p.commands.len(), 3),
_ => panic!("expected Pipeline"),
}
}
#[test]
fn parse_background_job() {
let result = parse("cmd &");
assert!(result.is_ok());
let program = result.expect("ok");
match &program.statements[0] {
Stmt::Pipeline(p) => assert!(p.background),
_ => panic!("expected Pipeline with background"),
}
}
#[test]
fn parse_if_simple() {
let result = parse("if true; then echo; fi");
assert!(result.is_ok());
let program = result.expect("ok");
assert!(matches!(&program.statements[0], Stmt::If(_)));
}
#[test]
fn parse_if_else() {
let result = parse("if true; then echo; else echo; fi");
assert!(result.is_ok());
let program = result.expect("ok");
match &program.statements[0] {
Stmt::If(if_stmt) => assert!(if_stmt.else_branch.is_some()),
_ => panic!("expected If"),
}
}
#[test]
fn parse_elif_simple() {
let result = parse("if true; then echo a; elif false; then echo b; fi");
assert!(result.is_ok(), "parse failed: {:?}", result);
let program = result.expect("ok");
match &program.statements[0] {
Stmt::If(if_stmt) => {
assert!(if_stmt.else_branch.is_some());
let else_branch = if_stmt.else_branch.as_ref().unwrap();
assert_eq!(else_branch.len(), 1);
assert!(matches!(&else_branch[0], Stmt::If(_)));
}
_ => panic!("expected If"),
}
}
#[test]
fn parse_elif_with_else() {
let result = parse("if true; then echo a; elif false; then echo b; else echo c; fi");
assert!(result.is_ok(), "parse failed: {:?}", result);
let program = result.expect("ok");
match &program.statements[0] {
Stmt::If(outer_if) => {
let else_branch = outer_if.else_branch.as_ref().expect("outer else");
assert_eq!(else_branch.len(), 1);
match &else_branch[0] {
Stmt::If(inner_if) => {
assert!(inner_if.else_branch.is_some());
}
_ => panic!("expected nested If from elif"),
}
}
_ => panic!("expected If"),
}
}
#[test]
fn parse_multiple_elif() {
let result = parse(
"if [[ ${X} == 1 ]]; then echo one; elif [[ ${X} == 2 ]]; then echo two; elif [[ ${X} == 3 ]]; then echo three; else echo other; fi",
);
assert!(result.is_ok(), "parse failed: {:?}", result);
}
#[test]
fn parse_for_loop() {
let result = parse("for X in items; do echo; done");
assert!(result.is_ok());
let program = result.expect("ok");
assert!(matches!(&program.statements[0], Stmt::For(_)));
}
#[test]
fn parse_brackets_not_array_literal() {
let result = parse("cmd [1");
let _ = result;
}
#[test]
fn parse_named_arg() {
let result = parse("cmd foo=5");
assert!(result.is_ok());
let program = result.expect("ok");
match &program.statements[0] {
Stmt::Command(cmd) => {
assert_eq!(cmd.args.len(), 1);
assert!(matches!(&cmd.args[0], Arg::WordAssign { .. }));
}
_ => panic!("expected Command"),
}
}
#[test]
fn parse_short_flag() {
let result = parse("ls -l");
assert!(result.is_ok());
let program = result.expect("ok");
match &program.statements[0] {
Stmt::Command(cmd) => {
assert_eq!(cmd.name, "ls");
assert_eq!(cmd.args.len(), 1);
match &cmd.args[0] {
Arg::ShortFlag(name) => assert_eq!(name, "l"),
_ => panic!("expected ShortFlag"),
}
}
_ => panic!("expected Command"),
}
}
#[test]
fn parse_long_flag() {
let result = parse("git push --force");
assert!(result.is_ok());
let program = result.expect("ok");
match &program.statements[0] {
Stmt::Command(cmd) => {
assert_eq!(cmd.name, "git");
assert_eq!(cmd.args.len(), 2);
match &cmd.args[0] {
Arg::Positional(Expr::Literal(Value::String(s))) => assert_eq!(s, "push"),
_ => panic!("expected Positional push"),
}
match &cmd.args[1] {
Arg::LongFlag(name) => assert_eq!(name, "force"),
_ => panic!("expected LongFlag"),
}
}
_ => panic!("expected Command"),
}
}
#[test]
fn parse_long_flag_with_value() {
let result = parse(r#"git commit --message="hello""#);
assert!(result.is_ok());
let program = result.expect("ok");
match &program.statements[0] {
Stmt::Command(cmd) => {
assert_eq!(cmd.name, "git");
assert_eq!(cmd.args.len(), 2);
match &cmd.args[1] {
Arg::Named { key, value } => {
assert_eq!(key, "message");
match value {
Expr::Literal(Value::String(s)) => assert_eq!(s, "hello"),
_ => panic!("expected String value"),
}
}
_ => panic!("expected Named from --flag=value"),
}
}
_ => panic!("expected Command"),
}
}
#[test]
fn parse_mixed_flags_and_args() {
let result = parse(r#"git commit -m "message" --amend"#);
assert!(result.is_ok());
let program = result.expect("ok");
match &program.statements[0] {
Stmt::Command(cmd) => {
assert_eq!(cmd.name, "git");
assert_eq!(cmd.args.len(), 4);
assert!(matches!(&cmd.args[0], Arg::Positional(_)));
match &cmd.args[1] {
Arg::ShortFlag(name) => assert_eq!(name, "m"),
_ => panic!("expected ShortFlag -m"),
}
assert!(matches!(&cmd.args[2], Arg::Positional(_)));
match &cmd.args[3] {
Arg::LongFlag(name) => assert_eq!(name, "amend"),
_ => panic!("expected LongFlag --amend"),
}
}
_ => panic!("expected Command"),
}
}
#[test]
fn parse_redirect_stdout() {
let result = parse("cmd > file");
assert!(result.is_ok());
let program = result.expect("ok");
match &program.statements[0] {
Stmt::Pipeline(p) => {
assert_eq!(p.commands.len(), 1);
let cmd = &p.commands[0];
assert_eq!(cmd.redirects.len(), 1);
assert!(matches!(cmd.redirects[0].kind, RedirectKind::StdoutOverwrite));
}
_ => panic!("expected Pipeline"),
}
}
#[test]
fn parse_var_ref() {
let result = parse("echo ${VAR}");
assert!(result.is_ok());
let program = result.expect("ok");
match &program.statements[0] {
Stmt::Command(cmd) => {
assert_eq!(cmd.args.len(), 1);
assert!(matches!(&cmd.args[0], Arg::Positional(Expr::VarRef(_))));
}
_ => panic!("expected Command"),
}
}
#[test]
fn parse_multiple_statements() {
let result = parse("a\nb\nc");
assert!(result.is_ok());
let program = result.expect("ok");
let non_empty: Vec<_> = program.statements.iter().filter(|s| !matches!(s, Stmt::Empty)).collect();
assert_eq!(non_empty.len(), 3);
}
#[test]
fn parse_semicolon_separated() {
let result = parse("a; b; c");
assert!(result.is_ok());
let program = result.expect("ok");
let non_empty: Vec<_> = program.statements.iter().filter(|s| !matches!(s, Stmt::Empty)).collect();
assert_eq!(non_empty.len(), 3);
}
#[test]
fn parse_complex_pipeline() {
let result = parse(r#"cat file | grep pattern="foo" | head count=10"#);
assert!(result.is_ok());
let program = result.expect("ok");
match &program.statements[0] {
Stmt::Pipeline(p) => assert_eq!(p.commands.len(), 3),
_ => panic!("expected Pipeline"),
}
}
#[test]
fn parse_json_as_string_arg() {
let result = parse(r#"cmd '[[1, 2], [3, 4]]'"#);
assert!(result.is_ok());
}
#[test]
fn parse_mixed_args() {
let result = parse(r#"cmd pos1 key="val" pos2 num=42"#);
assert!(result.is_ok());
let program = result.expect("ok");
match &program.statements[0] {
Stmt::Command(cmd) => assert_eq!(cmd.args.len(), 4),
_ => panic!("expected Command"),
}
}
#[test]
fn error_unterminated_string() {
let result = parse(r#"echo "hello"#);
assert!(result.is_err());
}
#[test]
fn error_unterminated_var_ref() {
let result = parse("echo ${VAR");
assert!(result.is_err());
}
#[test]
fn error_missing_fi() {
let result = parse("if true; then echo");
assert!(result.is_err());
}
#[test]
fn error_missing_done() {
let result = parse("for X in items; do echo");
assert!(result.is_err());
}
#[test]
fn parse_nested_cmd_subst() {
let result = parse("X=$(echo $(date))").unwrap();
match &result.statements[0] {
Stmt::Assignment(a) => {
assert_eq!(a.name, "X");
match &a.value {
Expr::CommandSubst(outer) => {
assert_eq!(outer.commands[0].name, "echo");
match &outer.commands[0].args[0] {
Arg::Positional(Expr::CommandSubst(inner)) => {
assert_eq!(inner.commands[0].name, "date");
}
other => panic!("expected nested cmd subst, got {:?}", other),
}
}
other => panic!("expected cmd subst, got {:?}", other),
}
}
other => panic!("expected assignment, got {:?}", other),
}
}
#[test]
fn parse_deeply_nested_cmd_subst() {
let result = parse("X=$(a $(b $(c)))").unwrap();
match &result.statements[0] {
Stmt::Assignment(a) => match &a.value {
Expr::CommandSubst(level1) => {
assert_eq!(level1.commands[0].name, "a");
match &level1.commands[0].args[0] {
Arg::Positional(Expr::CommandSubst(level2)) => {
assert_eq!(level2.commands[0].name, "b");
match &level2.commands[0].args[0] {
Arg::Positional(Expr::CommandSubst(level3)) => {
assert_eq!(level3.commands[0].name, "c");
}
other => panic!("expected level3 cmd subst, got {:?}", other),
}
}
other => panic!("expected level2 cmd subst, got {:?}", other),
}
}
other => panic!("expected cmd subst, got {:?}", other),
},
other => panic!("expected assignment, got {:?}", other),
}
}
#[test]
fn value_int_preserved() {
let result = parse("X=42").unwrap();
match &result.statements[0] {
Stmt::Assignment(a) => {
assert_eq!(a.name, "X");
match &a.value {
Expr::Literal(Value::Int(n)) => assert_eq!(*n, 42),
other => panic!("expected int literal, got {:?}", other),
}
}
other => panic!("expected assignment, got {:?}", other),
}
}
#[test]
fn value_negative_int_preserved() {
let result = parse("X=-99").unwrap();
match &result.statements[0] {
Stmt::Assignment(a) => match &a.value {
Expr::Literal(Value::Int(n)) => assert_eq!(*n, -99),
other => panic!("expected int, got {:?}", other),
},
other => panic!("expected assignment, got {:?}", other),
}
}
#[test]
fn value_float_preserved() {
let result = parse("PI=3.14").unwrap();
match &result.statements[0] {
Stmt::Assignment(a) => match &a.value {
Expr::Literal(Value::Float(f)) => assert!((*f - 3.14).abs() < 0.001),
other => panic!("expected float, got {:?}", other),
},
other => panic!("expected assignment, got {:?}", other),
}
}
#[test]
fn value_string_preserved() {
let result = parse(r#"echo "hello world""#).unwrap();
match &result.statements[0] {
Stmt::Command(cmd) => {
assert_eq!(cmd.name, "echo");
match &cmd.args[0] {
Arg::Positional(Expr::Literal(Value::String(s))) => {
assert_eq!(s, "hello world");
}
other => panic!("expected string arg, got {:?}", other),
}
}
other => panic!("expected command, got {:?}", other),
}
}
#[test]
fn value_string_with_escapes_preserved() {
let result = parse(r#"echo "line1\nline2""#).unwrap();
match &result.statements[0] {
Stmt::Command(cmd) => match &cmd.args[0] {
Arg::Positional(Expr::Literal(Value::String(s))) => {
assert_eq!(s, "line1\nline2");
}
other => panic!("expected string, got {:?}", other),
},
other => panic!("expected command, got {:?}", other),
}
}
#[test]
fn value_command_name_preserved() {
let result = parse("my-command").unwrap();
match &result.statements[0] {
Stmt::Command(cmd) => assert_eq!(cmd.name, "my-command"),
other => panic!("expected command, got {:?}", other),
}
}
#[test]
fn value_assignment_name_preserved() {
let result = parse("MY_VAR=1").unwrap();
match &result.statements[0] {
Stmt::Assignment(a) => assert_eq!(a.name, "MY_VAR"),
other => panic!("expected assignment, got {:?}", other),
}
}
#[test]
fn value_for_variable_preserved() {
let result = parse("for ITEM in items; do echo; done").unwrap();
match &result.statements[0] {
Stmt::For(f) => assert_eq!(f.variable, "ITEM"),
other => panic!("expected for, got {:?}", other),
}
}
#[test]
fn value_varref_name_preserved() {
let result = parse("echo ${MESSAGE}").unwrap();
match &result.statements[0] {
Stmt::Command(cmd) => match &cmd.args[0] {
Arg::Positional(Expr::VarRef(path)) => {
assert_eq!(path.segments.len(), 1);
let VarSegment::Field(name) = &path.segments[0];
assert_eq!(name, "MESSAGE");
}
other => panic!("expected varref, got {:?}", other),
},
other => panic!("expected command, got {:?}", other),
}
}
#[test]
fn value_varref_field_access_preserved() {
let result = parse("echo ${RESULT.data}").unwrap();
match &result.statements[0] {
Stmt::Command(cmd) => match &cmd.args[0] {
Arg::Positional(Expr::VarRef(path)) => {
assert_eq!(path.segments.len(), 2);
let VarSegment::Field(a) = &path.segments[0];
let VarSegment::Field(b) = &path.segments[1];
assert_eq!(a, "RESULT");
assert_eq!(b, "data");
}
other => panic!("expected varref, got {:?}", other),
},
other => panic!("expected command, got {:?}", other),
}
}
#[test]
fn value_varref_index_ignored() {
let result = parse("echo ${ITEMS[0]}").unwrap();
match &result.statements[0] {
Stmt::Command(cmd) => match &cmd.args[0] {
Arg::Positional(Expr::VarRef(path)) => {
assert_eq!(path.segments.len(), 1);
let VarSegment::Field(name) = &path.segments[0];
assert_eq!(name, "ITEMS");
}
other => panic!("expected varref, got {:?}", other),
},
other => panic!("expected command, got {:?}", other),
}
}
#[test]
fn value_named_arg_preserved() {
let result = parse("cmd count=42").unwrap();
match &result.statements[0] {
Stmt::Command(cmd) => {
assert_eq!(cmd.name, "cmd");
match &cmd.args[0] {
Arg::WordAssign { key, value } => {
assert_eq!(key, "count");
match value {
Expr::Literal(Value::Int(n)) => assert_eq!(*n, 42),
other => panic!("expected int, got {:?}", other),
}
}
other => panic!("expected WordAssign arg, got {:?}", other),
}
}
other => panic!("expected command, got {:?}", other),
}
}
#[test]
fn value_function_def_name_preserved() {
let result = parse("greet() { echo }").unwrap();
match &result.statements[0] {
Stmt::ToolDef(t) => {
assert_eq!(t.name, "greet");
assert!(t.params.is_empty());
}
other => panic!("expected function def, got {:?}", other),
}
}
#[test]
fn parse_comparison_equals() {
let result = parse("if [[ ${X} == 5 ]]; then echo; fi").unwrap();
match &result.statements[0] {
Stmt::If(if_stmt) => match if_stmt.condition.as_ref() {
Expr::Test(test) => match test.as_ref() {
TestExpr::Comparison { left, op, right } => {
assert!(matches!(left.as_ref(), Expr::VarRef(_)));
assert_eq!(*op, TestCmpOp::Eq);
match right.as_ref() {
Expr::Literal(Value::Int(n)) => assert_eq!(*n, 5),
other => panic!("expected int, got {:?}", other),
}
}
other => panic!("expected comparison, got {:?}", other),
},
other => panic!("expected test expr, got {:?}", other),
},
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn parse_comparison_not_equals() {
let result = parse("if [[ ${X} != 0 ]]; then echo; fi").unwrap();
match &result.statements[0] {
Stmt::If(if_stmt) => match if_stmt.condition.as_ref() {
Expr::Test(test) => match test.as_ref() {
TestExpr::Comparison { op, .. } => assert_eq!(*op, TestCmpOp::NotEq),
other => panic!("expected comparison, got {:?}", other),
},
other => panic!("expected test expr, got {:?}", other),
},
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn parse_comparison_less_than() {
let result = parse("if [[ ${COUNT} -lt 10 ]]; then echo; fi").unwrap();
match &result.statements[0] {
Stmt::If(if_stmt) => match if_stmt.condition.as_ref() {
Expr::Test(test) => match test.as_ref() {
TestExpr::Comparison { op, .. } => assert_eq!(*op, TestCmpOp::NumLt),
other => panic!("expected comparison, got {:?}", other),
},
other => panic!("expected test expr, got {:?}", other),
},
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn parse_comparison_greater_than() {
let result = parse("if [[ ${COUNT} -gt 0 ]]; then echo; fi").unwrap();
match &result.statements[0] {
Stmt::If(if_stmt) => match if_stmt.condition.as_ref() {
Expr::Test(test) => match test.as_ref() {
TestExpr::Comparison { op, .. } => assert_eq!(*op, TestCmpOp::NumGt),
other => panic!("expected comparison, got {:?}", other),
},
other => panic!("expected test expr, got {:?}", other),
},
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn parse_comparison_less_equal() {
let result = parse("if [[ ${X} -le 100 ]]; then echo; fi").unwrap();
match &result.statements[0] {
Stmt::If(if_stmt) => match if_stmt.condition.as_ref() {
Expr::Test(test) => match test.as_ref() {
TestExpr::Comparison { op, .. } => assert_eq!(*op, TestCmpOp::NumLtEq),
other => panic!("expected comparison, got {:?}", other),
},
other => panic!("expected test expr, got {:?}", other),
},
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn parse_comparison_greater_equal() {
let result = parse("if [[ ${X} -ge 1 ]]; then echo; fi").unwrap();
match &result.statements[0] {
Stmt::If(if_stmt) => match if_stmt.condition.as_ref() {
Expr::Test(test) => match test.as_ref() {
TestExpr::Comparison { op, .. } => assert_eq!(*op, TestCmpOp::NumGtEq),
other => panic!("expected comparison, got {:?}", other),
},
other => panic!("expected test expr, got {:?}", other),
},
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn parse_regex_match() {
let result = parse(r#"if [[ ${NAME} =~ "^test" ]]; then echo; fi"#).unwrap();
match &result.statements[0] {
Stmt::If(if_stmt) => match if_stmt.condition.as_ref() {
Expr::Test(test) => match test.as_ref() {
TestExpr::Comparison { op, .. } => assert_eq!(*op, TestCmpOp::Match),
other => panic!("expected comparison, got {:?}", other),
},
other => panic!("expected test expr, got {:?}", other),
},
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn parse_regex_not_match() {
let result = parse(r#"if [[ ${NAME} !~ "^test" ]]; then echo; fi"#).unwrap();
match &result.statements[0] {
Stmt::If(if_stmt) => match if_stmt.condition.as_ref() {
Expr::Test(test) => match test.as_ref() {
TestExpr::Comparison { op, .. } => assert_eq!(*op, TestCmpOp::NotMatch),
other => panic!("expected comparison, got {:?}", other),
},
other => panic!("expected test expr, got {:?}", other),
},
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn parse_string_interpolation() {
let result = parse(r#"echo "Hello ${NAME}!""#).unwrap();
match &result.statements[0] {
Stmt::Command(cmd) => match &cmd.args[0] {
Arg::Positional(Expr::Interpolated(parts)) => {
assert_eq!(parts.len(), 3);
match &parts[0] {
StringPart::Literal(s) => assert_eq!(s, "Hello "),
other => panic!("expected literal, got {:?}", other),
}
match &parts[1] {
StringPart::Var(path) => {
assert_eq!(path.segments.len(), 1);
let VarSegment::Field(name) = &path.segments[0];
assert_eq!(name, "NAME");
}
other => panic!("expected var, got {:?}", other),
}
match &parts[2] {
StringPart::Literal(s) => assert_eq!(s, "!"),
other => panic!("expected literal, got {:?}", other),
}
}
other => panic!("expected interpolated, got {:?}", other),
},
other => panic!("expected command, got {:?}", other),
}
}
#[test]
fn parse_string_interpolation_multiple_vars() {
let result = parse(r#"echo "${FIRST} and ${SECOND}""#).unwrap();
match &result.statements[0] {
Stmt::Command(cmd) => match &cmd.args[0] {
Arg::Positional(Expr::Interpolated(parts)) => {
assert_eq!(parts.len(), 3);
assert!(matches!(&parts[0], StringPart::Var(_)));
assert!(matches!(&parts[1], StringPart::Literal(_)));
assert!(matches!(&parts[2], StringPart::Var(_)));
}
other => panic!("expected interpolated, got {:?}", other),
},
other => panic!("expected command, got {:?}", other),
}
}
#[test]
fn parse_empty_function_body() {
let result = parse("empty() { }").unwrap();
match &result.statements[0] {
Stmt::ToolDef(t) => {
assert_eq!(t.name, "empty");
assert!(t.params.is_empty());
assert!(t.body.is_empty());
}
other => panic!("expected function def, got {:?}", other),
}
}
#[test]
fn parse_bash_style_function() {
let result = parse("function greet { echo hello }").unwrap();
match &result.statements[0] {
Stmt::ToolDef(t) => {
assert_eq!(t.name, "greet");
assert!(t.params.is_empty());
assert_eq!(t.body.len(), 1);
}
other => panic!("expected function def, got {:?}", other),
}
}
#[test]
fn parse_comparison_string_values() {
let result = parse(r#"if [[ ${STATUS} == "ok" ]]; then echo; fi"#).unwrap();
match &result.statements[0] {
Stmt::If(if_stmt) => match if_stmt.condition.as_ref() {
Expr::Test(test) => match test.as_ref() {
TestExpr::Comparison { left, op, right } => {
assert!(matches!(left.as_ref(), Expr::VarRef(_)));
assert_eq!(*op, TestCmpOp::Eq);
match right.as_ref() {
Expr::Literal(Value::String(s)) => assert_eq!(s, "ok"),
other => panic!("expected string, got {:?}", other),
}
}
other => panic!("expected comparison, got {:?}", other),
},
other => panic!("expected test expr, got {:?}", other),
},
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn parse_cmd_subst_simple() {
let result = parse("X=$(echo)").unwrap();
match &result.statements[0] {
Stmt::Assignment(a) => {
assert_eq!(a.name, "X");
match &a.value {
Expr::CommandSubst(pipeline) => {
assert_eq!(pipeline.commands.len(), 1);
assert_eq!(pipeline.commands[0].name, "echo");
}
other => panic!("expected command subst, got {:?}", other),
}
}
other => panic!("expected assignment, got {:?}", other),
}
}
#[test]
fn parse_cmd_subst_with_args() {
let result = parse(r#"X=$(fetch url="http://example.com")"#).unwrap();
match &result.statements[0] {
Stmt::Assignment(a) => match &a.value {
Expr::CommandSubst(pipeline) => {
assert_eq!(pipeline.commands[0].name, "fetch");
assert_eq!(pipeline.commands[0].args.len(), 1);
match &pipeline.commands[0].args[0] {
Arg::WordAssign { key, .. } => assert_eq!(key, "url"),
other => panic!("expected WordAssign arg, got {:?}", other),
}
}
other => panic!("expected command subst, got {:?}", other),
},
other => panic!("expected assignment, got {:?}", other),
}
}
#[test]
fn parse_cmd_subst_pipeline() {
let result = parse("X=$(cat file | grep pattern)").unwrap();
match &result.statements[0] {
Stmt::Assignment(a) => match &a.value {
Expr::CommandSubst(pipeline) => {
assert_eq!(pipeline.commands.len(), 2);
assert_eq!(pipeline.commands[0].name, "cat");
assert_eq!(pipeline.commands[1].name, "grep");
}
other => panic!("expected command subst, got {:?}", other),
},
other => panic!("expected assignment, got {:?}", other),
}
}
#[test]
fn parse_cmd_subst_in_condition() {
let result = parse("if kaish-validate; then echo; fi").unwrap();
match &result.statements[0] {
Stmt::If(if_stmt) => match if_stmt.condition.as_ref() {
Expr::Command(cmd) => {
assert_eq!(cmd.name, "kaish-validate");
}
other => panic!("expected command, got {:?}", other),
},
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn parse_cmd_subst_in_command_arg() {
let result = parse("echo $(whoami)").unwrap();
match &result.statements[0] {
Stmt::Command(cmd) => {
assert_eq!(cmd.name, "echo");
match &cmd.args[0] {
Arg::Positional(Expr::CommandSubst(pipeline)) => {
assert_eq!(pipeline.commands[0].name, "whoami");
}
other => panic!("expected command subst, got {:?}", other),
}
}
other => panic!("expected command, got {:?}", other),
}
}
#[test]
fn parse_condition_and() {
let result = parse("if check-a && check-b; then echo; fi").unwrap();
match &result.statements[0] {
Stmt::If(if_stmt) => match if_stmt.condition.as_ref() {
Expr::BinaryOp { left, op, right } => {
assert_eq!(*op, BinaryOp::And);
assert!(matches!(left.as_ref(), Expr::Command(_)));
assert!(matches!(right.as_ref(), Expr::Command(_)));
}
other => panic!("expected binary op, got {:?}", other),
},
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn parse_condition_or() {
let result = parse("if try-a || try-b; then echo; fi").unwrap();
match &result.statements[0] {
Stmt::If(if_stmt) => match if_stmt.condition.as_ref() {
Expr::BinaryOp { left, op, right } => {
assert_eq!(*op, BinaryOp::Or);
assert!(matches!(left.as_ref(), Expr::Command(_)));
assert!(matches!(right.as_ref(), Expr::Command(_)));
}
other => panic!("expected binary op, got {:?}", other),
},
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn parse_condition_and_or_precedence() {
let result = parse("if cmd-a && cmd-b || cmd-c; then echo; fi").unwrap();
match &result.statements[0] {
Stmt::If(if_stmt) => match if_stmt.condition.as_ref() {
Expr::BinaryOp { left, op, right } => {
assert_eq!(*op, BinaryOp::Or);
match left.as_ref() {
Expr::BinaryOp { op: inner_op, .. } => {
assert_eq!(*inner_op, BinaryOp::And);
}
other => panic!("expected binary op (&&), got {:?}", other),
}
assert!(matches!(right.as_ref(), Expr::Command(_)));
}
other => panic!("expected binary op, got {:?}", other),
},
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn parse_condition_multiple_and() {
let result = parse("if cmd-a && cmd-b && cmd-c; then echo; fi").unwrap();
match &result.statements[0] {
Stmt::If(if_stmt) => match if_stmt.condition.as_ref() {
Expr::BinaryOp { left, op, .. } => {
assert_eq!(*op, BinaryOp::And);
match left.as_ref() {
Expr::BinaryOp { op: inner_op, .. } => {
assert_eq!(*inner_op, BinaryOp::And);
}
other => panic!("expected binary op, got {:?}", other),
}
}
other => panic!("expected binary op, got {:?}", other),
},
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn parse_condition_mixed_comparison_and_logical() {
let result = parse("if [[ ${X} == 5 ]] && [[ ${Y} -gt 0 ]]; then echo; fi").unwrap();
match &result.statements[0] {
Stmt::If(if_stmt) => match if_stmt.condition.as_ref() {
Expr::BinaryOp { left, op, right } => {
assert_eq!(*op, BinaryOp::And);
match left.as_ref() {
Expr::Test(test) => match test.as_ref() {
TestExpr::Comparison { op: left_op, .. } => {
assert_eq!(*left_op, TestCmpOp::Eq);
}
other => panic!("expected comparison, got {:?}", other),
},
other => panic!("expected test, got {:?}", other),
}
match right.as_ref() {
Expr::Test(test) => match test.as_ref() {
TestExpr::Comparison { op: right_op, .. } => {
assert_eq!(*right_op, TestCmpOp::NumGt);
}
other => panic!("expected comparison, got {:?}", other),
},
other => panic!("expected test, got {:?}", other),
}
}
other => panic!("expected binary op, got {:?}", other),
},
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn script_level1_linear() {
let script = r#"
NAME="kaish"
VERSION=1
TIMEOUT=30
ITEMS="alpha beta gamma"
echo "Starting ${NAME} v${VERSION}"
cat "README.md" | grep pattern="install" | head count=5
fetch url="https://api.example.com/status" timeout=${TIMEOUT} > "/tmp/status.json"
echo "Items: ${ITEMS}"
"#;
let result = parse(script).unwrap();
let stmts: Vec<_> = result.statements.iter()
.filter(|s| !matches!(s, Stmt::Empty))
.collect();
assert_eq!(stmts.len(), 8);
assert!(matches!(stmts[0], Stmt::Assignment(_))); assert!(matches!(stmts[1], Stmt::Assignment(_))); assert!(matches!(stmts[2], Stmt::Assignment(_))); assert!(matches!(stmts[3], Stmt::Assignment(_))); assert!(matches!(stmts[4], Stmt::Command(_))); assert!(matches!(stmts[5], Stmt::Pipeline(_))); assert!(matches!(stmts[6], Stmt::Pipeline(_))); assert!(matches!(stmts[7], Stmt::Command(_))); }
#[test]
fn script_level2_branching() {
let script = r#"
RESULT=$(kaish-validate "input.json")
if [[ ${RESULT.ok} == true ]]; then
echo "Validation passed"
process "input.json" > "output.json"
else
echo "Validation failed: ${RESULT.err}"
fi
if [[ ${COUNT} -gt 0 ]] && [[ ${COUNT} -le 100 ]]; then
echo "Count in valid range"
fi
if check-network || check-cache; then
fetch url=${URL}
fi
"#;
let result = parse(script).unwrap();
let stmts: Vec<_> = result.statements.iter()
.filter(|s| !matches!(s, Stmt::Empty))
.collect();
assert_eq!(stmts.len(), 4);
match stmts[0] {
Stmt::Assignment(a) => {
assert_eq!(a.name, "RESULT");
assert!(matches!(&a.value, Expr::CommandSubst(_)));
}
other => panic!("expected assignment, got {:?}", other),
}
match stmts[1] {
Stmt::If(if_stmt) => {
assert_eq!(if_stmt.then_branch.len(), 2);
assert!(if_stmt.else_branch.is_some());
assert_eq!(if_stmt.else_branch.as_ref().unwrap().len(), 1);
}
other => panic!("expected if, got {:?}", other),
}
match stmts[2] {
Stmt::If(if_stmt) => {
match if_stmt.condition.as_ref() {
Expr::BinaryOp { op, .. } => assert_eq!(*op, BinaryOp::And),
other => panic!("expected && condition, got {:?}", other),
}
}
other => panic!("expected if, got {:?}", other),
}
match stmts[3] {
Stmt::If(if_stmt) => {
match if_stmt.condition.as_ref() {
Expr::BinaryOp { op, left, right } => {
assert_eq!(*op, BinaryOp::Or);
assert!(matches!(left.as_ref(), Expr::Command(_)));
assert!(matches!(right.as_ref(), Expr::Command(_)));
}
other => panic!("expected || condition, got {:?}", other),
}
}
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn script_level3_loops_and_functions() {
let script = r#"
greet() {
echo "Hello, $1!"
}
fetch_all() {
for URL in $@; do
fetch url=${URL}
done
}
USERS="alice bob charlie"
for USER in ${USERS}; do
greet ${USER}
if [[ ${USER} == "bob" ]]; then
echo "Found Bob!"
fi
done
long-running-task &
"#;
let result = parse(script).unwrap();
let stmts: Vec<_> = result.statements.iter()
.filter(|s| !matches!(s, Stmt::Empty))
.collect();
assert_eq!(stmts.len(), 5);
match stmts[0] {
Stmt::ToolDef(t) => {
assert_eq!(t.name, "greet");
assert!(t.params.is_empty());
}
other => panic!("expected function def, got {:?}", other),
}
match stmts[1] {
Stmt::ToolDef(t) => {
assert_eq!(t.name, "fetch_all");
assert_eq!(t.body.len(), 1);
assert!(matches!(&t.body[0], Stmt::For(_)));
}
other => panic!("expected function def, got {:?}", other),
}
assert!(matches!(stmts[2], Stmt::Assignment(_)));
match stmts[3] {
Stmt::For(f) => {
assert_eq!(f.variable, "USER");
assert_eq!(f.body.len(), 2);
assert!(matches!(&f.body[0], Stmt::Command(_)));
assert!(matches!(&f.body[1], Stmt::If(_)));
}
other => panic!("expected for loop, got {:?}", other),
}
match stmts[4] {
Stmt::Pipeline(p) => {
assert!(p.background);
assert_eq!(p.commands[0].name, "long-running-task");
}
other => panic!("expected pipeline (background), got {:?}", other),
}
}
#[test]
fn script_level4_complex_nesting() {
let script = r#"
RESULT=$(cat "config.json" | jq query=".servers" | kaish-validate schema="server-schema.json")
if ping host=${HOST} && [[ ${RESULT} == true ]]; then
for SERVER in "prod-1 prod-2"; do
deploy target=${SERVER} port=8080
if [[ $? -ne 0 ]]; then
notify channel="ops" message="Deploy failed"
fi
done
fi
"#;
let result = parse(script).unwrap();
let stmts: Vec<_> = result.statements.iter()
.filter(|s| !matches!(s, Stmt::Empty))
.collect();
assert_eq!(stmts.len(), 2);
match stmts[0] {
Stmt::Assignment(a) => {
assert_eq!(a.name, "RESULT");
match &a.value {
Expr::CommandSubst(pipeline) => {
assert_eq!(pipeline.commands.len(), 3);
}
other => panic!("expected command subst, got {:?}", other),
}
}
other => panic!("expected assignment, got {:?}", other),
}
match stmts[1] {
Stmt::If(if_stmt) => {
match if_stmt.condition.as_ref() {
Expr::BinaryOp { op, .. } => assert_eq!(*op, BinaryOp::And),
other => panic!("expected && condition, got {:?}", other),
}
assert_eq!(if_stmt.then_branch.len(), 1);
match &if_stmt.then_branch[0] {
Stmt::For(f) => {
assert_eq!(f.body.len(), 2);
assert!(matches!(&f.body[1], Stmt::If(_)));
}
other => panic!("expected for in if body, got {:?}", other),
}
}
other => panic!("expected if, got {:?}", other),
}
}
#[test]
fn script_level5_edge_cases() {
let script = r#"
echo ""
echo "quotes: \"nested\" here"
echo "escapes: \n\t\r\\"
echo "unicode: \u2764"
X=-99999
Y=3.14159265358979
Z=-0.001
cmd a=1 b="two" c=true d=false e=null
if true; then
if false; then
echo "inner"
else
echo "else"
fi
fi
for I in "a b c"; do
echo ${I}
done
no_params() {
echo "no params"
}
function all_args {
echo "args: $@"
}
a | b | c | d | e &
cmd 2> "errors.log"
cmd &> "all.log"
cmd >> "append.log"
cmd < "input.txt"
"#;
let result = parse(script).unwrap();
let stmts: Vec<_> = result.statements.iter()
.filter(|s| !matches!(s, Stmt::Empty))
.collect();
assert!(stmts.len() >= 10, "expected many statements, got {}", stmts.len());
let bg_stmt = stmts.iter().find(|s| matches!(s, Stmt::Pipeline(p) if p.background));
assert!(bg_stmt.is_some(), "expected background pipeline");
match bg_stmt.unwrap() {
Stmt::Pipeline(p) => {
assert_eq!(p.commands.len(), 5);
assert!(p.background);
}
_ => unreachable!(),
}
}
#[test]
fn parse_keyword_as_variable_rejected() {
let result = parse(r#"if="value""#);
assert!(result.is_err(), "if= should fail - 'if' is a keyword");
let result = parse("while=true");
assert!(result.is_err(), "while= should fail - 'while' is a keyword");
let result = parse(r#"then="next""#);
assert!(result.is_err(), "then= should fail - 'then' is a keyword");
}
#[test]
fn parse_set_command_with_flag() {
let result = parse("set -e");
assert!(result.is_ok(), "failed to parse set -e: {:?}", result);
let program = result.unwrap();
match &program.statements[0] {
Stmt::Command(cmd) => {
assert_eq!(cmd.name, "set");
assert_eq!(cmd.args.len(), 1);
match &cmd.args[0] {
Arg::ShortFlag(f) => assert_eq!(f, "e"),
other => panic!("expected ShortFlag, got {:?}", other),
}
}
other => panic!("expected Command, got {:?}", other),
}
}
#[test]
fn parse_set_command_no_args() {
let result = parse("set");
assert!(result.is_ok(), "failed to parse set: {:?}", result);
let program = result.unwrap();
match &program.statements[0] {
Stmt::Command(cmd) => {
assert_eq!(cmd.name, "set");
assert_eq!(cmd.args.len(), 0);
}
other => panic!("expected Command, got {:?}", other),
}
}
#[test]
fn parse_set_assignment_vs_command() {
let result = parse("X=5");
assert!(result.is_ok());
let program = result.unwrap();
assert!(matches!(&program.statements[0], Stmt::Assignment(_)));
let result = parse("set -e");
assert!(result.is_ok());
let program = result.unwrap();
assert!(matches!(&program.statements[0], Stmt::Command(_)));
}
#[test]
fn parse_true_as_command() {
let result = parse("true");
assert!(result.is_ok());
let program = result.unwrap();
match &program.statements[0] {
Stmt::Command(cmd) => assert_eq!(cmd.name, "true"),
other => panic!("expected Command(true), got {:?}", other),
}
}
#[test]
fn parse_false_as_command() {
let result = parse("false");
assert!(result.is_ok());
let program = result.unwrap();
match &program.statements[0] {
Stmt::Command(cmd) => assert_eq!(cmd.name, "false"),
other => panic!("expected Command(false), got {:?}", other),
}
}
#[test]
fn parse_dot_as_source_alias() {
let result = parse(". script.kai");
assert!(result.is_ok(), "failed to parse . script.kai: {:?}", result);
let program = result.unwrap();
match &program.statements[0] {
Stmt::Command(cmd) => {
assert_eq!(cmd.name, ".");
assert_eq!(cmd.args.len(), 1);
}
other => panic!("expected Command(.), got {:?}", other),
}
}
#[test]
fn parse_source_command() {
let result = parse("source utils.kai");
assert!(result.is_ok(), "failed to parse source: {:?}", result);
let program = result.unwrap();
match &program.statements[0] {
Stmt::Command(cmd) => {
assert_eq!(cmd.name, "source");
assert_eq!(cmd.args.len(), 1);
}
other => panic!("expected Command(source), got {:?}", other),
}
}
#[test]
fn parse_test_expr_file_test() {
let result = parse(r#"[[ -f "/path/file" ]]"#);
assert!(result.is_ok(), "failed to parse file test: {:?}", result);
}
#[test]
fn parse_test_expr_comparison() {
let result = parse(r#"[[ $X == "value" ]]"#);
assert!(result.is_ok(), "failed to parse comparison test: {:?}", result);
}
#[test]
fn parse_test_expr_single_eq() {
let result = parse(r#"[[ $X = "value" ]]"#);
assert!(result.is_ok(), "failed to parse single-= comparison: {:?}", result);
let program = result.unwrap();
match &program.statements[0] {
Stmt::Test(TestExpr::Comparison { op, .. }) => {
assert_eq!(op, &TestCmpOp::Eq);
}
other => panic!("expected Test(Comparison), got {:?}", other),
}
}
#[test]
fn parse_while_loop() {
let result = parse("while true; do echo; done");
assert!(result.is_ok(), "failed to parse while loop: {:?}", result);
let program = result.unwrap();
assert!(matches!(&program.statements[0], Stmt::While(_)));
}
#[test]
fn parse_break_with_level() {
let result = parse("break 2");
assert!(result.is_ok());
let program = result.unwrap();
match &program.statements[0] {
Stmt::Break(Some(n)) => assert_eq!(*n, 2),
other => panic!("expected Break(2), got {:?}", other),
}
}
#[test]
fn parse_continue_with_level() {
let result = parse("continue 3");
assert!(result.is_ok());
let program = result.unwrap();
match &program.statements[0] {
Stmt::Continue(Some(n)) => assert_eq!(*n, 3),
other => panic!("expected Continue(3), got {:?}", other),
}
}
#[test]
fn parse_exit_with_code() {
let result = parse("exit 1");
assert!(result.is_ok());
let program = result.unwrap();
match &program.statements[0] {
Stmt::Exit(Some(expr)) => {
match expr.as_ref() {
Expr::Literal(Value::Int(n)) => assert_eq!(*n, 1),
other => panic!("expected Int(1), got {:?}", other),
}
}
other => panic!("expected Exit(1), got {:?}", other),
}
}
#[test]
fn spanned_literal_only_records_byte_range() {
let parts = parse_interpolated_string_spanned("hello world", 100);
assert_eq!(parts.len(), 1);
assert!(matches!(&parts[0].part, StringPart::Literal(s) if s == "hello world"));
assert_eq!(parts[0].offset, 100, "base_offset must propagate to literals");
assert_eq!(parts[0].len, 11);
}
#[test]
fn spanned_braced_var_at_zero() {
let parts = parse_interpolated_string_spanned("${X}", 50);
assert_eq!(parts.len(), 1);
assert!(matches!(&parts[0].part, StringPart::Var(_)));
assert_eq!(parts[0].offset, 50);
assert_eq!(parts[0].len, 4); }
#[test]
fn spanned_simple_var_then_literal() {
let parts = parse_interpolated_string_spanned("$X end", 10);
assert_eq!(parts.len(), 2);
assert!(matches!(&parts[0].part, StringPart::Var(_)));
assert_eq!(parts[0].offset, 10);
assert_eq!(parts[0].len, 2); assert!(matches!(&parts[1].part, StringPart::Literal(s) if s == " end"));
assert_eq!(parts[1].offset, 12);
assert_eq!(parts[1].len, 4);
}
#[test]
fn spanned_mixed_literal_var_literal() {
let parts = parse_interpolated_string_spanned("hi ${X} bye", 0);
assert_eq!(parts.len(), 3);
assert!(matches!(&parts[0].part, StringPart::Literal(s) if s == "hi "));
assert_eq!(parts[0].offset, 0);
assert_eq!(parts[0].len, 3);
assert!(matches!(&parts[1].part, StringPart::Var(_)));
assert_eq!(parts[1].offset, 3);
assert_eq!(parts[1].len, 4);
assert!(matches!(&parts[2].part, StringPart::Literal(s) if s == " bye"));
assert_eq!(parts[2].offset, 7);
assert_eq!(parts[2].len, 4);
}
#[test]
fn spanned_positional_param() {
let parts = parse_interpolated_string_spanned("$1 done", 0);
assert_eq!(parts.len(), 2);
assert!(matches!(&parts[0].part, StringPart::Positional(1)));
assert_eq!(parts[0].offset, 0);
assert_eq!(parts[0].len, 2); }
#[test]
fn spanned_special_dollar_dollar() {
let parts = parse_interpolated_string_spanned("$$", 5);
assert_eq!(parts.len(), 1);
assert!(matches!(&parts[0].part, StringPart::CurrentPid));
assert_eq!(parts[0].offset, 5);
assert_eq!(parts[0].len, 2);
}
#[test]
fn spanned_arithmetic_marker_recognised() {
let parts = parse_interpolated_string_spanned("${__ARITH:1+2__}", 0);
assert_eq!(parts.len(), 1);
assert!(matches!(&parts[0].part, StringPart::Arithmetic(e) if e == "1+2"));
}
#[test]
fn spanned_default_separator_yields_var_with_default() {
let parts = parse_interpolated_string_spanned("${X:-fallback}", 0);
assert_eq!(parts.len(), 1);
assert!(matches!(&parts[0].part, StringPart::VarWithDefault { .. }));
assert_eq!(parts[0].offset, 0);
assert_eq!(parts[0].len, 14); }
#[test]
fn spanned_no_dollar_runs_one_literal() {
let parts = parse_interpolated_string_spanned("plain text only", 7);
assert_eq!(parts.len(), 1);
assert!(matches!(&parts[0].part, StringPart::Literal(s) if s == "plain text only"));
assert_eq!(parts[0].offset, 7);
assert_eq!(parts[0].len, 15);
}
#[test]
fn spanned_matches_unspanned_part_count() {
let cases = [
"hello",
"$X",
"${X}",
"${X:-d}",
"hi $A and $B",
"$0 $1 $2",
"$$ $? $#",
];
for s in &cases {
let unspanned = parse_interpolated_string(s);
let spanned = parse_interpolated_string_spanned(s, 0);
assert_eq!(
unspanned.len(),
spanned.len(),
"part count differs for {:?}",
s
);
}
}
#[test]
fn spanned_multibyte_utf8_before_var_uses_byte_offsets() {
let parts = parse_interpolated_string_spanned("π ${X}", 0);
assert_eq!(parts.len(), 2);
assert!(matches!(&parts[0].part, StringPart::Literal(s) if s == "π "));
assert_eq!(parts[0].offset, 0);
assert_eq!(parts[0].len, 5, "literal len must be bytes, not chars");
assert!(matches!(&parts[1].part, StringPart::Var(_)));
assert_eq!(parts[1].offset, 5, "var offset must be bytes, not chars");
assert_eq!(parts[1].len, 4);
}
#[test]
fn spanned_multibyte_utf8_pure_literal_is_byte_length() {
let parts = parse_interpolated_string_spanned("hello δΈη world", 0);
assert_eq!(parts.len(), 1);
assert!(matches!(&parts[0].part, StringPart::Literal(s) if s == "hello δΈη world"));
assert_eq!(parts[0].offset, 0);
assert_eq!(parts[0].len, 18);
}
#[test]
fn spanned_escape_dollar_consumes_two_bytes_emits_one_char() {
let parts = parse_interpolated_string_spanned("\\$", 0);
assert_eq!(parts.len(), 1);
assert!(matches!(&parts[0].part, StringPart::Literal(s) if s == "$"));
assert_eq!(parts[0].offset, 0);
assert_eq!(parts[0].len, 2, "len is source byte length, not rendered length");
}
#[test]
fn spanned_escape_backslash_collapses_pair_to_one() {
let parts = parse_interpolated_string_spanned("\\\\", 0);
assert_eq!(parts.len(), 1);
assert!(matches!(&parts[0].part, StringPart::Literal(s) if s == "\\"));
assert_eq!(parts[0].len, 2);
}
}