#![no_std]
#![forbid(unsafe_code)]
#![warn(missing_docs)]
extern crate alloc;
#[cfg(feature = "std")]
extern crate std;
pub mod input;
#[cfg(feature = "math")]
mod math;
#[cfg(feature = "regex")]
mod regex;
#[cfg(feature = "time")]
mod time;
use alloc::string::{String, ToString};
use alloc::{boxed::Box, vec::Vec};
use bstr::{BStr, ByteSlice};
use jaq_core::box_iter::{box_once, BoxIter};
use jaq_core::native::{bome, run, unary, v, Filter, Fun};
use jaq_core::{load, Bind, Cv, DataT, Error, Exn, RunPtr, ValR, ValT as _, ValX, ValXs};
pub fn defs() -> impl Iterator<Item = load::parse::Def<&'static str>> {
load::parse(include_str!("defs.jq"), |p| p.defs())
.unwrap()
.into_iter()
}
#[cfg(all(
feature = "std",
feature = "format",
feature = "log",
feature = "math",
feature = "regex",
feature = "time",
))]
pub fn funs<D: DataT>() -> impl Iterator<Item = Fun<D>>
where
for<'a> D::V<'a>: ValT,
{
base_funs().chain(extra_funs())
}
pub fn base_funs<D: DataT>() -> impl Iterator<Item = Fun<D>>
where
for<'a> D::V<'a>: ValT,
{
base_run().into_vec().into_iter().map(run)
}
#[cfg(all(
feature = "std",
feature = "format",
feature = "log",
feature = "math",
feature = "regex",
feature = "time",
))]
pub fn extra_funs<D: DataT>() -> impl Iterator<Item = Fun<D>>
where
for<'a> D::V<'a>: ValT,
{
[std(), format(), math(), regex(), time(), log()]
.into_iter()
.flat_map(|fs| fs.into_vec().into_iter().map(run))
}
pub trait ValT: jaq_core::ValT + Ord + From<f64> + From<usize> {
fn into_seq<S: FromIterator<Self>>(self) -> Result<S, Self>;
fn is_int(&self) -> bool;
fn as_isize(&self) -> Option<isize>;
fn as_f64(&self) -> Option<f64>;
fn is_utf8_str(&self) -> bool;
fn as_bytes(&self) -> Option<&[u8]>;
fn as_utf8_bytes(&self) -> Option<&[u8]> {
self.is_utf8_str().then(|| self.as_bytes()).flatten()
}
fn try_as_bytes(&self) -> Result<&[u8], Error<Self>> {
self.as_bytes().ok_or_else(|| self.fail_str())
}
fn try_as_utf8_bytes(&self) -> Result<&[u8], Error<Self>> {
self.as_utf8_bytes().ok_or_else(|| self.fail_str())
}
fn as_sub_str(&self, sub: &[u8]) -> Self;
fn from_utf8_bytes(b: impl AsRef<[u8]> + Send + 'static) -> Self;
}
trait ValTx: ValT + Sized {
fn into_vec(self) -> Result<Vec<Self>, Error<Self>> {
self.into_seq().map_err(|v| Error::typ(v, "array"))
}
fn try_as_isize(&self) -> Result<isize, Error<Self>> {
self.as_isize()
.ok_or_else(|| Error::typ(self.clone(), "integer"))
}
#[cfg(feature = "math")]
fn try_as_i32(&self) -> Result<i32, Error<Self>> {
self.try_as_isize()?.try_into().map_err(Error::str)
}
fn try_as_f64(&self) -> Result<f64, Error<Self>> {
self.as_f64()
.ok_or_else(|| Error::typ(self.clone(), "number"))
}
fn mutate_arr(self, f: impl FnOnce(&mut Vec<Self>)) -> ValR<Self> {
let mut a = self.into_vec()?;
f(&mut a);
Ok(Self::from_iter(a))
}
fn try_mutate_arr<'a, F>(self, f: F) -> ValX<'a, Self>
where
F: FnOnce(&mut Vec<Self>) -> Result<(), Exn<'a, Self>>,
{
let mut a = self.into_vec()?;
f(&mut a)?;
Ok(Self::from_iter(a))
}
fn round(self, f: impl FnOnce(f64) -> f64) -> ValR<Self> {
Ok(if self.is_int() {
self
} else {
let f = f(self.try_as_f64()?);
if f.is_finite() {
if isize::MIN as f64 <= f && f <= isize::MAX as f64 {
Self::from(f as isize)
} else {
Self::from_num(&alloc::format!("{f:.0}"))?
}
} else {
Self::from(f)
}
})
}
fn try_as_str(&self) -> Result<&str, Error<Self>> {
self.try_as_utf8_bytes()
.and_then(|s| core::str::from_utf8(s).map_err(Error::str))
}
fn map_utf8_str<B>(self, f: impl FnOnce(&[u8]) -> B) -> ValR<Self>
where
B: AsRef<[u8]> + Send + 'static,
{
Ok(Self::from_utf8_bytes(f(self.try_as_utf8_bytes()?)))
}
fn trim_utf8_with(&self, f: impl FnOnce(&[u8]) -> &[u8]) -> ValR<Self> {
Ok(self.as_sub_str(f(self.try_as_utf8_bytes()?)))
}
fn strip_fix<F>(self, fix: &Self, f: F) -> Result<Self, Error<Self>>
where
F: for<'a> FnOnce(&'a [u8], &[u8]) -> Option<&'a [u8]>,
{
Ok(match f(self.try_as_bytes()?, fix.try_as_bytes()?) {
Some(sub) => self.as_sub_str(sub),
None => self,
})
}
fn fail_str(&self) -> Error<Self> {
Error::typ(self.clone(), "string")
}
}
impl<T: ValT> ValTx for T {}
fn sort_by<'a, V: ValT>(xs: &mut [V], f: impl Fn(V) -> ValXs<'a, V>) -> Result<(), Exn<'a, V>> {
let mut err = None;
xs.sort_by_cached_key(|x| {
if err.is_some() {
return Vec::new();
};
match f(x.clone()).collect() {
Ok(y) => y,
Err(e) => {
err = Some(e);
Vec::new()
}
}
});
err.map_or(Ok(()), Err)
}
fn group_by<'a, V: ValT>(xs: Vec<V>, f: impl Fn(V) -> ValXs<'a, V>) -> ValX<'a, V> {
let mut yx: Vec<(Vec<V>, V)> = xs
.into_iter()
.map(|x| Ok((f(x.clone()).collect::<Result<_, _>>()?, x)))
.collect::<Result<_, Exn<_>>>()?;
yx.sort_by(|(y1, _), (y2, _)| y1.cmp(y2));
let mut grouped = Vec::new();
let mut yx = yx.into_iter();
if let Some((mut group_y, first_x)) = yx.next() {
let mut group = Vec::from([first_x]);
for (y, x) in yx {
if group_y != y {
grouped.push(V::from_iter(core::mem::take(&mut group)));
group_y = y;
}
group.push(x);
}
if !group.is_empty() {
grouped.push(V::from_iter(group));
}
}
Ok(V::from_iter(grouped))
}
fn cmp_by<'a, V: Clone, F, R>(xs: Vec<V>, f: F, replace: R) -> Result<Option<V>, Exn<'a, V>>
where
F: Fn(V) -> ValXs<'a, V>,
R: Fn(&[V], &[V]) -> bool,
{
let iter = xs.into_iter();
let mut iter = iter.map(|x| (x.clone(), f(x).collect::<Result<Vec<_>, _>>()));
let (mut mx, mut my) = if let Some((x, y)) = iter.next() {
(x, y?)
} else {
return Ok(None);
};
for (x, y) in iter {
let y = y?;
if replace(&my, &y) {
(mx, my) = (x, y);
}
}
Ok(Some(mx))
}
fn explode<V: ValT>(s: &[u8]) -> impl Iterator<Item = ValR<V>> + '_ {
let invalid = [].iter();
Explode { s, invalid }.map(|r| match r {
Err(b) => Ok((-(b as isize)).into()),
Ok(c) => Ok(isize::try_from(c as u32).map_err(Error::str)?.into()),
})
}
struct Explode<'a> {
s: &'a [u8],
invalid: core::slice::Iter<'a, u8>,
}
impl Iterator for Explode<'_> {
type Item = Result<char, u8>;
fn next(&mut self) -> Option<Self::Item> {
self.invalid.next().map(|next| Err(*next)).or_else(|| {
let (c, size) = bstr::decode_utf8(self.s);
let (consumed, rest) = self.s.split_at(size);
self.s = rest;
c.map(Ok).or_else(|| {
self.invalid = consumed.iter();
self.invalid.next().map(|next| Err(*next))
})
})
}
fn size_hint(&self) -> (usize, Option<usize>) {
let max = self.s.len();
let min = self.s.len() / 4;
let inv = self.invalid.as_slice().len();
(min + inv, Some(max + inv))
}
}
fn implode<V: ValT>(xs: &[V]) -> Result<Vec<u8>, Error<V>> {
let mut v = Vec::with_capacity(xs.len());
for x in xs {
let i = x.try_as_isize()?;
if let Ok(b) = u8::try_from(-i) {
v.push(b)
} else {
let c = u32::try_from(i).ok().and_then(char::from_u32);
let c = c.ok_or_else(|| Error::str(format_args!("cannot use {i} as character")))?;
v.extend(c.encode_utf8(&mut [0; 4]).as_bytes())
}
}
Ok(v)
}
fn once_or_empty<'a, T: 'a, E: 'a>(r: Result<Option<T>, E>) -> BoxIter<'a, Result<T, E>> {
Box::new(r.transpose().into_iter())
}
#[allow(clippy::unit_arg)]
fn base_run<D: DataT>() -> Box<[Filter<RunPtr<D>>]>
where
for<'a> D::V<'a>: ValT,
{
let f = || [Bind::Fun(())].into();
Box::new([
("floor", v(0), |cv| bome(cv.1.round(f64::floor))),
("round", v(0), |cv| bome(cv.1.round(f64::round))),
("ceil", v(0), |cv| bome(cv.1.round(f64::ceil))),
("utf8bytelength", v(0), |cv| {
bome(cv.1.try_as_utf8_bytes().map(|s| (s.len() as isize).into()))
}),
("explode", v(0), |cv| {
bome(cv.1.try_as_utf8_bytes().and_then(|s| explode(s).collect()))
}),
("implode", v(0), |cv| {
let implode = |s: Vec<_>| implode(&s);
bome(cv.1.into_vec().and_then(implode).map(D::V::from_utf8_bytes))
}),
("ascii_downcase", v(0), |cv| {
bome(cv.1.map_utf8_str(ByteSlice::to_ascii_lowercase))
}),
("ascii_upcase", v(0), |cv| {
bome(cv.1.map_utf8_str(ByteSlice::to_ascii_uppercase))
}),
("reverse", v(0), |cv| bome(cv.1.mutate_arr(|a| a.reverse()))),
("sort", v(0), |cv| bome(cv.1.mutate_arr(|a| a.sort()))),
("sort_by", f(), |mut cv| {
let (f, fc) = cv.0.pop_fun();
let f = move |v| f.run((fc.clone(), v));
box_once(cv.1.try_mutate_arr(|a| sort_by(a, f)))
}),
("group_by", f(), |mut cv| {
let (f, fc) = cv.0.pop_fun();
let f = move |v| f.run((fc.clone(), v));
box_once((|| group_by(cv.1.into_vec()?, f))())
}),
("min_by_or_empty", f(), |mut cv| {
let (f, fc) = cv.0.pop_fun();
let f = move |a| cmp_by(a, |v| f.run((fc.clone(), v)), |my, y| y < my);
once_or_empty(cv.1.into_vec().map_err(Exn::from).and_then(f))
}),
("max_by_or_empty", f(), |mut cv| {
let (f, fc) = cv.0.pop_fun();
let f = move |a| cmp_by(a, |v| f.run((fc.clone(), v)), |my, y| y >= my);
once_or_empty(cv.1.into_vec().map_err(Exn::from).and_then(f))
}),
("startswith", v(1), |cv| {
unary(cv, |v, s| {
Ok(v.try_as_bytes()?.starts_with(s.try_as_bytes()?).into())
})
}),
("endswith", v(1), |cv| {
unary(cv, |v, s| {
Ok(v.try_as_bytes()?.ends_with(s.try_as_bytes()?).into())
})
}),
("ltrimstr", v(1), |cv| {
unary(cv, |v, pre| v.strip_fix(&pre, <[u8]>::strip_prefix))
}),
("rtrimstr", v(1), |cv| {
unary(cv, |v, suf| v.strip_fix(&suf, <[u8]>::strip_suffix))
}),
("trim", v(0), |cv| {
bome(cv.1.trim_utf8_with(ByteSlice::trim))
}),
("ltrim", v(0), |cv| {
bome(cv.1.trim_utf8_with(ByteSlice::trim_start))
}),
("rtrim", v(0), |cv| {
bome(cv.1.trim_utf8_with(ByteSlice::trim_end))
}),
("escape_sh", v(0), |cv| {
bome(
cv.1.try_as_utf8_bytes()
.map(|s| ValT::from_utf8_bytes(s.replace(b"'", b"'\\''"))),
)
}),
])
}
#[cfg(feature = "std")]
fn now<V: From<String>>() -> Result<f64, Error<V>> {
use std::time::{SystemTime, UNIX_EPOCH};
SystemTime::now()
.duration_since(UNIX_EPOCH)
.map(|x| x.as_secs_f64())
.map_err(Error::str)
}
#[cfg(feature = "std")]
fn std<D: DataT>() -> Box<[Filter<RunPtr<D>>]>
where
for<'a> D::V<'a>: ValT,
{
use std::env::vars;
Box::new([
("env", v(0), |_| {
bome(D::V::from_map(
vars().map(|(k, v)| (D::V::from(k), D::V::from(v))),
))
}),
("now", v(0), |_| bome(now().map(D::V::from))),
("halt", v(1), |mut cv| {
let exit_code = cv.0.pop_var().try_as_isize();
bome(exit_code.map(|exit_code| std::process::exit(exit_code as i32)))
}),
])
}
#[cfg(feature = "format")]
fn replace(s: &[u8], patterns: &[&str], replacements: &[&str]) -> Vec<u8> {
let ac = aho_corasick::AhoCorasick::new(patterns).unwrap();
ac.replace_all_bytes(s, replacements)
}
#[cfg(feature = "format")]
fn format<D: DataT>() -> Box<[Filter<RunPtr<D>>]>
where
for<'a> D::V<'a>: ValT,
{
const HTML_PATS: [&str; 5] = ["<", ">", "&", "\'", "\""];
const HTML_REPS: [&str; 5] = ["<", ">", "&", "'", """];
Box::new([
("escape_html", v(0), |cv| {
bome(cv.1.map_utf8_str(|s| replace(s, &HTML_PATS, &HTML_REPS)))
}),
("unescape_html", v(0), |cv| {
bome(cv.1.map_utf8_str(|s| replace(s, &HTML_REPS, &HTML_PATS)))
}),
("encode_uri", v(0), |cv| {
bome(cv.1.map_utf8_str(|s| urlencoding::encode_binary(s).to_string()))
}),
("decode_uri", v(0), |cv| {
bome(cv.1.map_utf8_str(|s| urlencoding::decode_binary(s).to_vec()))
}),
("encode_base64", v(0), |cv| {
use base64::{engine::general_purpose::STANDARD, Engine};
bome(cv.1.map_utf8_str(|s| STANDARD.encode(s)))
}),
("decode_base64", v(0), |cv| {
use base64::{engine::general_purpose::STANDARD, Engine};
bome(cv.1.try_as_utf8_bytes().and_then(|s| {
STANDARD
.decode(s)
.map_err(Error::str)
.map(ValT::from_utf8_bytes)
}))
}),
])
}
#[cfg(feature = "math")]
fn math<D: DataT>() -> Box<[Filter<RunPtr<D>>]>
where
for<'a> D::V<'a>: ValT,
{
let rename = |name, (_name, arity, f): Filter<RunPtr<D>>| (name, arity, f);
Box::new([
math::f_f!(acos),
math::f_f!(acosh),
math::f_f!(asin),
math::f_f!(asinh),
math::f_f!(atan),
math::f_f!(atanh),
math::f_f!(cbrt),
math::f_f!(cos),
math::f_f!(cosh),
math::f_f!(erf),
math::f_f!(erfc),
math::f_f!(exp),
math::f_f!(exp10),
math::f_f!(exp2),
math::f_f!(expm1),
math::f_f!(fabs),
math::f_fi!(frexp),
math::f_i!(ilogb),
math::f_f!(j0),
math::f_f!(j1),
math::f_f!(lgamma),
math::f_f!(log),
math::f_f!(log10),
math::f_f!(log1p),
math::f_f!(log2),
math::f_ff!(modf),
rename("nearbyint", math::f_f!(round)),
math::f_f!(rint),
math::f_f!(sin),
math::f_f!(sinh),
math::f_f!(sqrt),
math::f_f!(tan),
math::f_f!(tanh),
math::f_f!(tgamma),
math::f_f!(trunc),
math::f_f!(y0),
math::f_f!(y1),
math::ff_f!(atan2),
math::ff_f!(copysign),
math::ff_f!(fdim),
math::ff_f!(fmax),
math::ff_f!(fmin),
math::ff_f!(fmod),
math::ff_f!(hypot),
math::if_f!(jn),
math::fi_f!(ldexp),
math::ff_f!(nextafter),
math::ff_f!(pow),
math::ff_f!(remainder),
rename("scalbln", math::fi_f!(scalbn)),
math::if_f!(yn),
math::fff_f!(fma),
])
}
#[cfg(feature = "regex")]
fn re<'a, D: DataT>(s: bool, m: bool, mut cv: Cv<'a, D>) -> ValR<D::V<'a>>
where
D::V<'a>: ValT,
{
let flags = cv.0.pop_var();
let re = cv.0.pop_var();
use crate::regex::Part::{Matches, Mismatch};
let fail_flag = |e| Error::str(format_args!("invalid regex flag: {e}"));
let fail_re = |e| Error::str(format_args!("invalid regex: {e}"));
let flags = regex::Flags::new(flags.try_as_str()?).map_err(fail_flag)?;
let re = flags.regex(re.try_as_str()?).map_err(fail_re)?;
let out = regex::regex(cv.1.try_as_utf8_bytes()?, &re, flags, (s, m));
let sub = |s| cv.1.as_sub_str(s);
let out = out.into_iter().map(|out| match out {
Matches(ms) => ms
.into_iter()
.map(|m| D::V::from_map(m.fields(sub)))
.collect(),
Mismatch(s) => Ok(sub(s)),
});
out.collect()
}
#[cfg(feature = "regex")]
fn regex<D: DataT>() -> Box<[Filter<RunPtr<D>>]>
where
for<'a> D::V<'a>: ValT,
{
let vv = || [Bind::Var(()), Bind::Var(())].into();
Box::new([
("matches", vv(), |cv| bome(re(false, true, cv))),
("split_matches", vv(), |cv| bome(re(true, true, cv))),
("split_", vv(), |cv| bome(re(true, false, cv))),
])
}
#[cfg(feature = "time")]
fn time<D: DataT>() -> Box<[Filter<RunPtr<D>>]>
where
for<'a> D::V<'a>: ValT,
{
use jiff::tz::TimeZone;
Box::new([
("fromdateiso8601", v(0), |cv| {
bome(cv.1.try_as_str().and_then(time::from_iso8601))
}),
("todateiso8601", v(0), |cv| {
bome(time::to_iso8601(&cv.1).map(D::V::from))
}),
("strftime", v(1), |cv| {
unary(cv, |v, fmt| {
time::strftime(&v, fmt.try_as_str()?, TimeZone::UTC)
})
}),
("strflocaltime", v(1), |cv| {
unary(cv, |v, fmt| {
time::strftime(&v, fmt.try_as_str()?, TimeZone::system())
})
}),
("gmtime", v(0), |cv| {
bome(time::gmtime(&cv.1, TimeZone::UTC))
}),
("localtime", v(0), |cv| {
bome(time::gmtime(&cv.1, TimeZone::system()))
}),
("strptime", v(1), |cv| {
unary(cv, |v, fmt| {
time::strptime(v.try_as_str()?, fmt.try_as_str()?)
})
}),
("mktime", v(0), |cv| bome(time::mktime(&cv.1))),
])
}
#[cfg(feature = "log")]
fn log<D: DataT>() -> Box<[Filter<RunPtr<D>>]>
where
for<'a> D::V<'a>: ValT,
{
fn eprint_raw<V: ValT>(v: &V) {
if let Some(s) = v.as_utf8_bytes() {
log::error!("{}", BStr::new(s))
} else {
log::error!("{v}")
}
}
macro_rules! empty_with {
( $eff:expr ) => {
|cv| {
$eff(&cv.1);
Box::new(core::iter::empty())
}
};
}
Box::new([
("debug_empty", v(0), empty_with!(|x| log::debug!("{x}"))),
("stderr_empty", v(0), empty_with!(eprint_raw)),
])
}