use peg::parser;
use std::{path::PathBuf, rc::Rc};
mod expr;
pub use expr::*;
pub use peg;
#[derive(Default)]
pub struct ParserSettings {
pub loc_data: bool,
pub file_name: Rc<PathBuf>,
}
parser! {
grammar jsonnet_parser() for str {
use peg::ParseLiteral;
rule comment()
= "//" (!['\n'][_])* "\n"
/ "/*" ("\\*/" / "\\\\" / (!("*/")[_]))* "*/"
/ "#" (!['\n'][_])* "\n"
rule single_whitespace() = quiet!{([' ' | '\r' | '\n' | '\t'] / comment())} / expected!("<whitespace>")
rule _() = single_whitespace()*
rule comma() = quiet!{_ "," _} / expected!("<comma>")
rule alpha() -> char = c:$(['_' | 'a'..='z' | 'A'..='Z']) {c.chars().next().unwrap()}
rule digit() -> char = d:$(['0'..='9']) {d.chars().next().unwrap()}
rule end_of_ident() = !['0'..='9' | '_' | 'a'..='z' | 'A'..='Z']
rule uint() -> u64 = a:$(digit()+) { a.parse().unwrap() }
rule number() -> f64 = quiet!{a:$(uint() ("." uint())? (['e'|'E'] (s:['+'|'-'])? uint())?) { a.parse().unwrap() }} / expected!("<number>")
rule reserved() = ("assert" / "else" / "error" / "false" / "for" / "function" / "if" / "import" / "importstr" / "in" / "local" / "null" / "tailstrict" / "then" / "self" / "super" / "true") end_of_ident()
rule id() = quiet!{ !reserved() alpha() (alpha() / digit())*} / expected!("<identifier>")
rule keyword(id: &'static str)
= ##parse_string_literal(id) end_of_ident()
rule l(s: &ParserSettings, x: rule<Expr>) -> LocExpr
= start:position!() v:x() end:position!() {loc_expr!(v, s.loc_data, (s.file_name.clone(), start, end))}
pub rule param(s: &ParserSettings) -> expr::Param = name:$(id()) expr:(_ "=" _ expr:expr(s){expr})? { expr::Param(name.into(), expr) }
pub rule params(s: &ParserSettings) -> expr::ParamsDesc
= params:param(s) ** comma() comma()? {
let mut defaults_started = false;
for param in ¶ms {
defaults_started = defaults_started || param.1.is_some();
assert_eq!(defaults_started, param.1.is_some(), "defauld parameters should be used after all positionals");
}
expr::ParamsDesc(Rc::new(params))
}
/ { expr::ParamsDesc(Rc::new(Vec::new())) }
pub rule arg(s: &ParserSettings) -> expr::Arg
= name:$(id()) _ "=" _ expr:expr(s) {expr::Arg(Some(name.into()), expr)}
/ expr:expr(s) {expr::Arg(None, expr)}
pub rule args(s: &ParserSettings) -> expr::ArgsDesc
= args:arg(s) ** comma() comma()? {
let mut named_started = false;
for arg in &args {
named_started = named_started || arg.0.is_some();
assert_eq!(named_started, arg.0.is_some(), "named args should be used after all positionals");
}
expr::ArgsDesc(args)
}
/ { expr::ArgsDesc(Vec::new()) }
pub rule bind(s: &ParserSettings) -> expr::BindSpec
= name:$(id()) _ "=" _ expr:expr(s) {expr::BindSpec{name:name.into(), params: None, value: expr}}
/ name:$(id()) _ "(" _ params:params(s) _ ")" _ "=" _ expr:expr(s) {expr::BindSpec{name:name.into(), params: Some(params), value: expr}}
pub rule assertion(s: &ParserSettings) -> expr::AssertStmt
= keyword("assert") _ cond:expr(s) msg:(_ ":" _ e:expr(s) {e})? { expr::AssertStmt(cond, msg) }
pub rule whole_line() -> &'input str
= str:$((!['\n'][_])* "\n") {str}
pub rule string_block() -> String
= "|||" (!['\n']single_whitespace())* "\n"
prefix:[' ' | '\t']+ first_line:whole_line()
lines:([' ' | '\t']*<{prefix.len()}> s:whole_line() {s})*
[' ' | '\t']*<, {prefix.len() - 1}> "|||"
{let mut l = first_line.to_owned(); l.extend(lines); l}
pub rule string() -> String
= "\"" str:$(("\\\"" / "\\\\" / (!['"'][_]))*) "\"" {unescape::unescape(str).unwrap()}
/ "'" str:$(("\\'" / "\\\\" / (!['\''][_]))*) "'" {unescape::unescape(str).unwrap()}
/ "@'" str:$(("''" / (!['\''][_]))*) "'" {str.replace("''", "'")}
/ "@\"" str:$(("\"\"" / (!['"'][_]))*) "\"" {str.replace("\"\"", "\"")}
/ string_block()
pub rule field_name(s: &ParserSettings) -> expr::FieldName
= name:$(id()) {expr::FieldName::Fixed(name.into())}
/ name:string() {expr::FieldName::Fixed(name.into())}
/ "[" _ expr:expr(s) _ "]" {expr::FieldName::Dyn(expr)}
pub rule visibility() -> expr::Visibility
= ":::" {expr::Visibility::Unhide}
/ "::" {expr::Visibility::Hidden}
/ ":" {expr::Visibility::Normal}
pub rule field(s: &ParserSettings) -> expr::FieldMember
= name:field_name(s) _ plus:"+"? _ visibility:visibility() _ value:expr(s) {expr::FieldMember{
name,
plus: plus.is_some(),
params: None,
visibility,
value,
}}
/ name:field_name(s) _ "(" _ params:params(s) _ ")" _ visibility:visibility() _ value:expr(s) {expr::FieldMember{
name,
plus: false,
params: Some(params),
visibility,
value,
}}
pub rule obj_local(s: &ParserSettings) -> BindSpec
= keyword("local") _ bind:bind(s) {bind}
pub rule member(s: &ParserSettings) -> expr::Member
= bind:obj_local(s) {expr::Member::BindStmt(bind)}
/ assertion:assertion(s) {expr::Member::AssertStmt(assertion)}
/ field:field(s) {expr::Member::Field(field)}
pub rule objinside(s: &ParserSettings) -> expr::ObjBody
= pre_locals:(b: obj_local(s) comma() {b})* "[" _ key:expr(s) _ "]" _ ":" _ value:expr(s) post_locals:(comma() b:obj_local(s) {b})* _ forspec:forspec(s) others:(_ rest:compspec(s) {rest})? {
let mut compspecs = vec![CompSpec::ForSpec(forspec)];
compspecs.extend(others.unwrap_or_default());
expr::ObjBody::ObjComp(expr::ObjComp{
pre_locals,
key,
value,
post_locals,
compspecs,
})
}
/ members:(member(s) ** comma()) comma()? {expr::ObjBody::MemberList(members)}
pub rule ifspec(s: &ParserSettings) -> IfSpecData
= keyword("if") _ expr:expr(s) {IfSpecData(expr)}
pub rule forspec(s: &ParserSettings) -> ForSpecData
= keyword("for") _ id:$(id()) _ keyword("in") _ cond:expr(s) {ForSpecData(id.into(), cond)}
pub rule compspec(s: &ParserSettings) -> Vec<expr::CompSpec>
= s:(i:ifspec(s) { expr::CompSpec::IfSpec(i) } / f:forspec(s) {expr::CompSpec::ForSpec(f)} ) ** _ {s}
pub rule local_expr(s: &ParserSettings) -> LocExpr
= l(s,<keyword("local") _ binds:bind(s) ** comma() _ ";" _ expr:expr(s) { Expr::LocalExpr(binds, expr) }>)
pub rule string_expr(s: &ParserSettings) -> LocExpr
= l(s, <s:string() {Expr::Str(s.into())}>)
pub rule obj_expr(s: &ParserSettings) -> LocExpr
= l(s,<"{" _ body:objinside(s) _ "}" {Expr::Obj(body)}>)
pub rule array_expr(s: &ParserSettings) -> LocExpr
= l(s,<"[" _ elems:(expr(s) ** comma()) _ comma()? "]" {Expr::Arr(elems)}>)
pub rule array_comp_expr(s: &ParserSettings) -> LocExpr
= l(s,<"[" _ expr:expr(s) _ comma()? _ forspec:forspec(s) _ others:(others: compspec(s) _ {others})? "]" {
let mut specs = vec![CompSpec::ForSpec(forspec)];
specs.extend(others.unwrap_or_default());
Expr::ArrComp(expr, specs)
}>)
pub rule number_expr(s: &ParserSettings) -> LocExpr
= l(s,<n:number() { expr::Expr::Num(n) }>)
pub rule var_expr(s: &ParserSettings) -> LocExpr
= l(s,<n:$(id()) { expr::Expr::Var(n.into()) }>)
pub rule if_then_else_expr(s: &ParserSettings) -> LocExpr
= l(s,<cond:ifspec(s) _ keyword("then") _ cond_then:expr(s) cond_else:(_ keyword("else") _ e:expr(s) {e})? {Expr::IfElse{
cond,
cond_then,
cond_else,
}}>)
pub rule literal(s: &ParserSettings) -> LocExpr
= l(s,<v:(
keyword("null") {LiteralType::Null}
/ keyword("true") {LiteralType::True}
/ keyword("false") {LiteralType::False}
/ keyword("self") {LiteralType::This}
/ keyword("$") {LiteralType::Dollar}
/ keyword("super") {LiteralType::Super}
) {Expr::Literal(v)}>)
pub rule expr_basic(s: &ParserSettings) -> LocExpr
= literal(s)
/ string_expr(s) / number_expr(s)
/ array_expr(s)
/ obj_expr(s)
/ array_expr(s)
/ array_comp_expr(s)
/ l(s,<keyword("importstr") _ path:string() {Expr::ImportStr(PathBuf::from(path))}>)
/ l(s,<keyword("import") _ path:string() {Expr::Import(PathBuf::from(path))}>)
/ var_expr(s)
/ local_expr(s)
/ if_then_else_expr(s)
/ l(s,<keyword("function") _ "(" _ params:params(s) _ ")" _ expr:expr(s) {Expr::Function(params, expr)}>)
/ l(s,<assertion:assertion(s) _ ";" _ expr:expr(s) { Expr::AssertExpr(assertion, expr) }>)
/ l(s,<keyword("error") _ expr:expr(s) { Expr::ErrorStmt(expr) }>)
rule slice_part(s: &ParserSettings) -> Option<LocExpr>
= e:(_ e:expr(s) _{e})? {e}
pub rule slice_desc(s: &ParserSettings) -> SliceDesc
= start:slice_part(s) ":" pair:(end:slice_part(s) step:(":" e:slice_part(s){e})? {(end, step.flatten())})? {
let (end, step) = if let Some((end, step)) = pair {
(end, step)
}else{
(None, None)
};
SliceDesc { start, end, step }
}
rule expr(s: &ParserSettings) -> LocExpr
= start:position!() a:precedence! {
a:(@) _ "||" _ b:@ {loc_expr_todo!(Expr::BinaryOp(a, BinaryOpType::Or, b))}
--
a:(@) _ "&&" _ b:@ {loc_expr_todo!(Expr::BinaryOp(a, BinaryOpType::And, b))}
--
a:(@) _ "|" _ b:@ {loc_expr_todo!(Expr::BinaryOp(a, BinaryOpType::BitOr, b))}
--
a:@ _ "^" _ b:(@) {loc_expr_todo!(Expr::BinaryOp(a, BinaryOpType::BitXor, b))}
--
a:(@) _ "&" _ b:@ {loc_expr_todo!(Expr::BinaryOp(a, BinaryOpType::BitAnd, b))}
--
a:(@) _ "==" _ b:@ {loc_expr_todo!(Expr::Apply(
el!(Expr::Index(
el!(Expr::Var("std".into())),
el!(Expr::Str("equals".into()))
)),
ArgsDesc(vec![Arg(None, a), Arg(None, b)]),
true
))}
a:(@) _ "!=" _ b:@ {loc_expr_todo!(Expr::UnaryOp(UnaryOpType::Not, el!(Expr::Apply(
el!(Expr::Index(
el!(Expr::Var("std".into())),
el!(Expr::Str("equals".into()))
)),
ArgsDesc(vec![Arg(None, a), Arg(None, b)]),
true
))))}
--
a:(@) _ "<" _ b:@ {loc_expr_todo!(Expr::BinaryOp(a, BinaryOpType::Lt, b))}
a:(@) _ ">" _ b:@ {loc_expr_todo!(Expr::BinaryOp(a, BinaryOpType::Gt, b))}
a:(@) _ "<=" _ b:@ {loc_expr_todo!(Expr::BinaryOp(a, BinaryOpType::Lte, b))}
a:(@) _ ">=" _ b:@ {loc_expr_todo!(Expr::BinaryOp(a, BinaryOpType::Gte, b))}
a:(@) _ keyword("in") _ b:@ {loc_expr_todo!(Expr::Apply(
el!(Expr::Index(
el!(Expr::Var("std".into())),
el!(Expr::Str("objectHasEx".into()))
)), ArgsDesc(vec![Arg(None, b), Arg(None, a), Arg(None, el!(Expr::Literal(LiteralType::True)))]),
true
))}
--
a:(@) _ "<<" _ b:@ {loc_expr_todo!(Expr::BinaryOp(a, BinaryOpType::Lhs, b))}
a:(@) _ ">>" _ b:@ {loc_expr_todo!(Expr::BinaryOp(a, BinaryOpType::Rhs, b))}
--
a:(@) _ "+" _ b:@ {loc_expr_todo!(Expr::BinaryOp(a, BinaryOpType::Add, b))}
a:(@) _ "-" _ b:@ {loc_expr_todo!(Expr::BinaryOp(a, BinaryOpType::Sub, b))}
--
a:(@) _ "*" _ b:@ {loc_expr_todo!(Expr::BinaryOp(a, BinaryOpType::Mul, b))}
a:(@) _ "/" _ b:@ {loc_expr_todo!(Expr::BinaryOp(a, BinaryOpType::Div, b))}
a:(@) _ "%" _ b:@ {loc_expr_todo!(Expr::Apply(
el!(Expr::Index(
el!(Expr::Var("std".into())),
el!(Expr::Str("mod".into()))
)), ArgsDesc(vec![Arg(None, a), Arg(None, b)]),
false
))}
--
"-" _ b:@ {loc_expr_todo!(Expr::UnaryOp(UnaryOpType::Minus, b))}
"!" _ b:@ {loc_expr_todo!(Expr::UnaryOp(UnaryOpType::Not, b))}
"~" _ b:@ { loc_expr_todo!(Expr::UnaryOp(UnaryOpType::BitNot, b)) }
--
a:(@) _ "[" _ s:slice_desc(s) _ "]" {loc_expr_todo!(Expr::Apply(
el!(Expr::Index(
el!(Expr::Var("std".into())),
el!(Expr::Str("slice".into())),
)),
ArgsDesc(vec![
Arg(None, a),
Arg(None, s.start.unwrap_or_else(||el!(Expr::Literal(LiteralType::Null)))),
Arg(None, s.end.unwrap_or_else(||el!(Expr::Literal(LiteralType::Null)))),
Arg(None, s.step.unwrap_or_else(||el!(Expr::Literal(LiteralType::Null)))),
]),
true,
))}
a:(@) _ "." _ s:$(id()) {loc_expr_todo!(Expr::Index(a, el!(Expr::Str(s.into()))))}
a:(@) _ "[" _ s:expr(s) _ "]" {loc_expr_todo!(Expr::Index(a, s))}
a:(@) _ "(" _ args:args(s) _ ")" ts:(_ keyword("tailstrict"))? {loc_expr_todo!(Expr::Apply(a, args, ts.is_some()))}
a:(@) _ "{" _ body:objinside(s) _ "}" {loc_expr_todo!(Expr::ObjExtend(a, body))}
--
e:expr_basic(s) {e}
"(" _ e:expr(s) _ ")" {loc_expr_todo!(Expr::Parened(e))}
} end:position!() {
let LocExpr(e, _) = a;
LocExpr(e, if s.loc_data {
Some(ExprLocation(s.file_name.clone(), start, end))
} else {
None
})
}
/ e:expr_basic(s) {e}
pub rule jsonnet(s: &ParserSettings) -> LocExpr = _ e:expr(s) _ {e}
}
}
pub type ParseError = peg::error::ParseError<peg::str::LineCol>;
pub fn parse(str: &str, settings: &ParserSettings) -> Result<LocExpr, ParseError> {
jsonnet_parser::jsonnet(str, settings)
}
#[macro_export]
macro_rules! el {
($expr:expr) => {
LocExpr(std::rc::Rc::new($expr), None)
};
}
#[cfg(test)]
pub mod tests {
use super::{expr::*, parse};
use crate::ParserSettings;
use std::path::PathBuf;
use std::rc::Rc;
macro_rules! parse {
($s:expr) => {
parse(
$s,
&ParserSettings {
loc_data: false,
file_name: Rc::new(PathBuf::from("/test.jsonnet")),
},
)
.unwrap()
};
}
mod expressions {
use super::*;
pub fn basic_math() -> LocExpr {
el!(Expr::BinaryOp(
el!(Expr::Num(2.0)),
BinaryOpType::Add,
el!(Expr::BinaryOp(
el!(Expr::Num(2.0)),
BinaryOpType::Mul,
el!(Expr::Num(2.0)),
)),
))
}
}
#[test]
fn multiline_string() {
assert_eq!(
parse!("|||\n Hello world!\n a\n|||"),
el!(Expr::Str("Hello world!\n a\n".into())),
);
assert_eq!(
parse!("|||\n Hello world!\n a\n|||"),
el!(Expr::Str("Hello world!\n a\n".into())),
);
assert_eq!(
parse!("|||\n\t\tHello world!\n\t\t\ta\n|||"),
el!(Expr::Str("Hello world!\n\ta\n".into())),
);
assert_eq!(
parse!("|||\n Hello world!\n a\n |||"),
el!(Expr::Str("Hello world!\n a\n".into())),
);
}
#[test]
fn slice() {
parse!("a[1:]");
parse!("a[1::]");
parse!("a[:1:]");
parse!("a[::1]");
parse!("str[:len - 1]");
}
#[test]
fn string_escaping() {
assert_eq!(
parse!(r#""Hello, \"world\"!""#),
el!(Expr::Str(r#"Hello, "world"!"#.into())),
);
assert_eq!(
parse!(r#"'Hello \'world\'!'"#),
el!(Expr::Str("Hello 'world'!".into())),
);
assert_eq!(parse!(r#"'\\\\'"#), el!(Expr::Str("\\\\".into())),);
}
#[test]
fn string_unescaping() {
assert_eq!(
parse!(r#""Hello\nWorld""#),
el!(Expr::Str("Hello\nWorld".into())),
);
}
#[test]
fn string_verbantim() {
assert_eq!(
parse!(r#"@"Hello\n""World""""#),
el!(Expr::Str("Hello\\n\"World\"".into())),
);
}
#[test]
fn imports() {
assert_eq!(
parse!("import \"hello\""),
el!(Expr::Import(PathBuf::from("hello"))),
);
assert_eq!(
parse!("importstr \"garnish.txt\""),
el!(Expr::ImportStr(PathBuf::from("garnish.txt")))
);
}
#[test]
fn empty_object() {
assert_eq!(parse!("{}"), el!(Expr::Obj(ObjBody::MemberList(vec![]))));
}
#[test]
fn basic_math() {
assert_eq!(
parse!("2+2*2"),
el!(Expr::BinaryOp(
el!(Expr::Num(2.0)),
BinaryOpType::Add,
el!(Expr::BinaryOp(
el!(Expr::Num(2.0)),
BinaryOpType::Mul,
el!(Expr::Num(2.0))
))
))
);
}
#[test]
fn basic_math_with_indents() {
assert_eq!(parse!("2 + 2 * 2 "), expressions::basic_math());
}
#[test]
fn basic_math_parened() {
assert_eq!(
parse!("2+(2+2*2)"),
el!(Expr::BinaryOp(
el!(Expr::Num(2.0)),
BinaryOpType::Add,
el!(Expr::Parened(expressions::basic_math())),
))
);
}
#[test]
fn comments() {
assert_eq!(
parse!("2//comment\n+//comment\n3/*test*/*/*test*/4"),
el!(Expr::BinaryOp(
el!(Expr::Num(2.0)),
BinaryOpType::Add,
el!(Expr::BinaryOp(
el!(Expr::Num(3.0)),
BinaryOpType::Mul,
el!(Expr::Num(4.0))
))
))
);
}
#[test]
fn comment_escaping() {
assert_eq!(
parse!("2/*\\*/+*/ - 22"),
el!(Expr::BinaryOp(
el!(Expr::Num(2.0)),
BinaryOpType::Sub,
el!(Expr::Num(22.0))
))
);
}
#[test]
fn suffix() {
}
#[test]
fn array_comp() {
use Expr::*;
assert_eq!(
parse!("[std.deepJoin(x) for x in arr]"),
el!(ArrComp(
el!(Apply(
el!(Index(el!(Var("std".into())), el!(Str("deepJoin".into())))),
ArgsDesc(vec![Arg(None, el!(Var("x".into())))]),
false,
)),
vec![CompSpec::ForSpec(ForSpecData(
"x".into(),
el!(Var("arr".into()))
))]
)),
)
}
#[test]
fn reserved() {
use Expr::*;
assert_eq!(parse!("null"), el!(Literal(LiteralType::Null)));
assert_eq!(parse!("nulla"), el!(Var("nulla".into())));
}
#[test]
fn multiple_args_buf() {
parse!("a(b, null_fields)");
}
#[test]
fn infix_precedence() {
use Expr::*;
assert_eq!(
parse!("!a && !b"),
el!(BinaryOp(
el!(UnaryOp(UnaryOpType::Not, el!(Var("a".into())))),
BinaryOpType::And,
el!(UnaryOp(UnaryOpType::Not, el!(Var("b".into()))))
))
);
}
#[test]
fn infix_precedence_division() {
use Expr::*;
assert_eq!(
parse!("!a / !b"),
el!(BinaryOp(
el!(UnaryOp(UnaryOpType::Not, el!(Var("a".into())))),
BinaryOpType::Div,
el!(UnaryOp(UnaryOpType::Not, el!(Var("b".into()))))
))
);
}
#[test]
fn double_negation() {
use Expr::*;
assert_eq!(
parse!("!!a"),
el!(UnaryOp(
UnaryOpType::Not,
el!(UnaryOp(UnaryOpType::Not, el!(Var("a".into()))))
))
)
}
#[test]
fn array_test_error() {
parse!("[a for a in b if c for e in f]");
}
#[test]
fn can_parse_stdlib() {
parse!(jrsonnet_stdlib::STDLIB_STR);
}
}