use std::borrow::Cow;
use crate::concat_string;
#[derive(Debug, Clone)]
pub enum HybridRegex {
Optimize(regex::Regex),
Ecma(regress::Regex),
}
impl From<&str> for HybridRegex {
fn from(pattern: &str) -> Self {
HybridRegex::new(pattern).unwrap_or_else(|err| {
panic!("failed to create HybridRegex from {pattern}, error details: {err}",)
})
}
}
impl HybridRegex {
pub fn new(pattern: &str) -> anyhow::Result<Self> {
let regex_pattern = Self::get_regex_pattern(pattern, "");
match regex::Regex::new(®ex_pattern).map(HybridRegex::Optimize) {
Ok(reg) => Ok(reg),
Err(_) => regress::Regex::new(pattern).map(HybridRegex::Ecma).map_err(anyhow::Error::from),
}
}
pub fn with_flags(pattern: &str, flags: &str) -> anyhow::Result<Self> {
let regex_pattern = Self::get_regex_pattern(pattern, flags);
match regex::Regex::new(®ex_pattern).map(HybridRegex::Optimize) {
Ok(reg) => Ok(reg),
Err(_) => regress::Regex::with_flags(pattern, flags)
.map(HybridRegex::Ecma)
.map_err(anyhow::Error::from),
}
}
pub fn regex_pattern(&self) -> Option<&str> {
match self {
HybridRegex::Optimize(r) => Some(r.as_str()),
HybridRegex::Ecma(_) => None,
}
}
fn get_regex_pattern(pattern: &str, flags: &str) -> String {
concat_string!("(?R", flags, ")", pattern)
}
pub fn matches(&self, text: &str) -> bool {
match self {
HybridRegex::Optimize(reg) => reg.is_match(text),
HybridRegex::Ecma(reg) => reg.find(text).is_some(),
}
}
pub fn replace<'a>(&self, haystack: &'a str, replacement: &str) -> Cow<'a, str> {
match self {
HybridRegex::Optimize(r) => r.replace(haystack, replacement),
HybridRegex::Ecma(reg) => {
let next = reg.find_iter(haystack).next();
let Some(m) = next else { return Cow::Borrowed(haystack) };
Cow::Owned(concat_string!(&haystack[..m.start()], replacement, &haystack[m.end()..]))
}
}
}
pub fn replace_all<'a>(&self, haystack: &'a str, replacement: &str) -> Cow<'a, str> {
match self {
HybridRegex::Optimize(r) => r.replace_all(haystack, replacement),
HybridRegex::Ecma(reg) => regress_regexp_replace_all(reg, haystack, replacement),
}
}
}
fn regress_regexp_replace_all<'h>(
reg: ®ress::Regex,
haystack: &'h str,
replacement: &str,
) -> Cow<'h, str> {
let iter = reg.find_iter(haystack);
let mut iter = iter.peekable();
if iter.peek().is_none() {
return Cow::Borrowed(haystack);
}
let mut ret = String::with_capacity(haystack.len());
let mut last = 0;
for m in iter {
ret.push_str(&haystack[last..m.start()]);
ret.push_str(replacement);
last = m.end();
}
ret.push_str(&haystack[last..]);
Cow::Owned(ret)
}
#[cfg(test)]
mod test {
use crate::js_regex::{HybridRegex, regress_regexp_replace_all};
#[test]
fn with_flags() {
let reg = HybridRegex::with_flags("a", "i").unwrap();
assert!(reg.matches("A"));
let reg = HybridRegex::new("a").unwrap();
assert!(!reg.matches("A"));
}
#[test]
fn regress_replace_all() {
let reg = regress::Regex::new("\\d+").unwrap();
assert_eq!(regress_regexp_replace_all(®, "111aa111", "1"), "1aa1");
}
#[test]
fn js_regex_compat_dot() {
let dot_reg = HybridRegex::new(".").unwrap();
assert!(!dot_reg.matches("\n"));
assert!(!dot_reg.matches("\r\n"));
let dots_reg = HybridRegex::with_flags(".", "s").unwrap();
assert!(dots_reg.matches("\n"));
assert!(dots_reg.matches("\r\n"));
assert!(dots_reg.matches("\u{2028}"));
assert!(dots_reg.matches("\u{2029}"));
}
#[test]
fn js_regex_compat_multiline() {
let reg = HybridRegex::with_flags("a$", "m").unwrap();
assert!(reg.matches("a\n"));
assert!(reg.matches("a\r\n"));
}
}