mod bash;
mod cpp;
mod csharp;
mod css;
mod elixir;
mod go;
mod json;
mod kotlin;
mod lua;
mod parsers;
mod php;
mod python;
mod ruby;
mod rust;
mod scala;
mod swift;
use ast_grep_core::language::TSLanguage;
use ast_grep_core::meta_var::MetaVariable;
use ignore::types::{Types, TypesBuilder};
use serde::{de, Deserialize, Deserializer, Serialize};
use std::borrow::Cow;
use std::fmt;
use std::fmt::{Display, Formatter};
use std::path::Path;
use std::str::FromStr;
pub use ast_grep_core::Language;
macro_rules! impl_lang {
($lang: ident, $func: ident) => {
#[derive(Clone, Copy)]
pub struct $lang;
impl Language for $lang {
fn get_ts_language(&self) -> TSLanguage {
parsers::$func().into()
}
}
};
}
macro_rules! impl_lang_expando {
($lang: ident, $func: ident, $char: expr) => {
#[derive(Clone, Copy)]
pub struct $lang;
impl ast_grep_core::language::Language for $lang {
fn get_ts_language(&self) -> ast_grep_core::language::TSLanguage {
$crate::parsers::$func().into()
}
fn expando_char(&self) -> char {
$char
}
fn pre_process_pattern<'q>(&self, query: &'q str) -> std::borrow::Cow<'q, str> {
let mut buf = [0; 4];
let expando = self.expando_char().encode_utf8(&mut buf);
let replaced = query.replace(self.meta_var_char(), expando);
std::borrow::Cow::Owned(replaced)
}
}
};
}
impl_lang_expando!(C, language_c, '_');
impl_lang_expando!(Cpp, language_cpp, '_');
impl_lang_expando!(CSharp, language_c_sharp, 'µ');
impl_lang_expando!(Css, language_css, '_');
impl_lang_expando!(Elixir, language_elixir, 'µ');
impl_lang_expando!(Go, language_go, 'µ');
impl_lang_expando!(Kotlin, language_kotlin, 'µ');
impl_lang_expando!(Python, language_python, 'µ');
impl_lang_expando!(Ruby, language_ruby, 'µ');
impl_lang_expando!(Rust, language_rust, 'µ');
impl_lang_expando!(Swift, language_swift, 'µ');
impl_lang!(Bash, language_bash);
impl_lang!(Dart, language_dart);
impl_lang!(Html, language_html);
impl_lang!(Java, language_java);
impl_lang!(JavaScript, language_javascript);
impl_lang!(Json, language_json);
impl_lang!(Lua, language_lua);
impl_lang!(Php, language_php);
impl_lang!(Scala, language_scala);
impl_lang!(Tsx, language_tsx);
impl_lang!(TypeScript, language_typescript);
#[derive(Clone, Copy, Debug, PartialEq, Eq, Serialize, Hash)]
pub enum SupportLang {
Bash,
C,
Cpp,
CSharp,
Css,
Dart,
Go,
Elixir,
Html,
Java,
JavaScript,
Json,
Kotlin,
Lua,
Php,
Python,
Ruby,
Rust,
Scala,
Swift,
Tsx,
TypeScript,
}
impl SupportLang {
pub const fn all_langs() -> &'static [SupportLang] {
use SupportLang::*;
&[
Bash, C, Cpp, CSharp, Css, Dart, Elixir, Go, Html, Java, JavaScript, Json, Kotlin, Lua, Php,
Python, Ruby, Rust, Scala, Swift, Tsx, TypeScript,
]
}
pub fn file_types(&self) -> Types {
file_types(self)
}
}
impl fmt::Display for SupportLang {
fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
write!(f, "{:?}", self)
}
}
#[derive(Debug)]
pub enum SupportLangErr {
LanguageNotSupported(String),
}
impl Display for SupportLangErr {
fn fmt(&self, f: &mut Formatter<'_>) -> Result<(), std::fmt::Error> {
use SupportLangErr::*;
match self {
LanguageNotSupported(lang) => write!(f, "{} is not supported!", lang),
}
}
}
impl std::error::Error for SupportLangErr {}
impl<'de> Deserialize<'de> for SupportLang {
fn deserialize<D>(deserializer: D) -> Result<Self, D::Error>
where
D: Deserializer<'de>,
{
let s = String::deserialize(deserializer)?;
FromStr::from_str(&s).map_err(de::Error::custom)
}
}
const fn alias(lang: &SupportLang) -> &[&str] {
use SupportLang::*;
match lang {
Bash => &["bash-exp"],
C => &["c"],
Cpp => &["cc", "c++", "cpp", "cxx"],
CSharp => &["cs", "csharp"],
Css => &["css"],
Dart => &["dart"],
Elixir => &["ex", "elixir"],
Go => &["go", "golang"],
Html => &["html"],
Java => &["java"],
JavaScript => &["javascript", "js", "jsx"],
Json => &["json"],
Kotlin => &["kotlin", "kt"],
Lua => &["lua"],
Php => &["php-exp"],
Python => &["py", "python"],
Ruby => &["rb", "ruby"],
Rust => &["rs", "rust"],
Scala => &["scala"],
Swift => &["swift"],
TypeScript => &["ts", "typescript"],
Tsx => &["tsx"],
}
}
impl FromStr for SupportLang {
type Err = SupportLangErr;
fn from_str(s: &str) -> Result<Self, Self::Err> {
for lang in Self::all_langs() {
for moniker in alias(lang) {
if s.eq_ignore_ascii_case(moniker) {
return Ok(*lang);
}
}
}
Err(SupportLangErr::LanguageNotSupported(s.to_string()))
}
}
macro_rules! execute_lang_method {
($me: path, $method: ident, $($pname:tt),*) => {
use SupportLang as S;
match $me {
S::Bash => Bash.$method($($pname,)*),
S::C => C.$method($($pname,)*),
S::Cpp => Cpp.$method($($pname,)*),
S::CSharp => CSharp.$method($($pname,)*),
S::Css => Css.$method($($pname,)*),
S::Dart => Dart.$method($($pname,)*),
S::Elixir => Elixir.$method($($pname,)*),
S::Go => Go.$method($($pname,)*),
S::Html => Html.$method($($pname,)*),
S::Java => Java.$method($($pname,)*),
S::JavaScript => JavaScript.$method($($pname,)*),
S::Json => Json.$method($($pname,)*),
S::Kotlin => Kotlin.$method($($pname,)*),
S::Lua => Lua.$method($($pname,)*),
S::Php => Php.$method($($pname,)*),
S::Python => Python.$method($($pname,)*),
S::Ruby => Ruby.$method($($pname,)*),
S::Rust => Rust.$method($($pname,)*),
S::Scala => Scala.$method($($pname,)*),
S::Swift => Swift.$method($($pname,)*),
S::Tsx => Tsx.$method($($pname,)*),
S::TypeScript => TypeScript.$method($($pname,)*),
}
}
}
macro_rules! impl_lang_method {
($method: ident, ($($pname:tt: $ptype:ty),*) => $return_type: ty) => {
#[inline]
fn $method(&self, $($pname: $ptype),*) -> $return_type {
execute_lang_method!{ self, $method, $($pname),* }
}
};
}
impl Language for SupportLang {
fn from_path<P: AsRef<Path>>(path: P) -> Option<Self> {
from_extension(path.as_ref())
}
impl_lang_method!(get_ts_language, () => TSLanguage);
impl_lang_method!(meta_var_char, () => char);
impl_lang_method!(expando_char, () => char);
impl_lang_method!(extract_meta_var, (source: &str) => Option<MetaVariable>);
fn pre_process_pattern<'q>(&self, query: &'q str) -> Cow<'q, str> {
execute_lang_method! { self, pre_process_pattern, query }
}
}
fn extensions(lang: &SupportLang) -> &[&str] {
use SupportLang::*;
match lang {
Bash => &[
"bash", "bats", "cgi", "command", "env", "fcgi", "ksh", "sh", "tmux", "tool", "zsh",
],
C => &["c", "h"],
Cpp => &["cc", "hpp", "cpp", "c++", "hh", "cxx", "cu", "ino"],
CSharp => &["cs"],
Css => &["css", "scss"],
Dart => &["dart"],
Elixir => &["ex", "exs"],
Go => &["go"],
Html => &["html", "htm", "xhtml"],
Java => &["java"],
JavaScript => &["cjs", "js", "mjs", "jsx"],
Json => &["json"],
Kotlin => &["kt", "ktm", "kts"],
Lua => &["lua"],
Php => &["php"],
Python => &["py", "py3", "pyi", "bzl"],
Ruby => &["rb", "rbw", "gemspec"],
Rust => &["rs"],
Scala => &["scala", "sc", "sbt"],
Swift => &["swift"],
TypeScript => &["ts", "cts", "mts"],
Tsx => &["tsx"],
}
}
fn from_extension(path: &Path) -> Option<SupportLang> {
let ext = path.extension()?.to_str()?;
SupportLang::all_langs()
.iter()
.copied()
.find(|l| extensions(l).contains(&ext))
}
fn add_custom_file_type<'b>(
builder: &'b mut TypesBuilder,
file_type: &str,
suffix_list: &[&str],
) -> &'b mut TypesBuilder {
for suffix in suffix_list {
let glob = format!("*.{suffix}");
builder
.add(file_type, &glob)
.expect("file pattern must compile");
}
builder.select(file_type)
}
fn file_types(lang: &SupportLang) -> Types {
let mut builder = TypesBuilder::new();
let exts = extensions(lang);
let lang_name = lang.to_string();
add_custom_file_type(&mut builder, &lang_name, exts);
builder.build().expect("file type must be valid")
}
pub fn config_file_type() -> Types {
let mut builder = TypesBuilder::new();
let builder = add_custom_file_type(&mut builder, "yml", &["yml", "yaml"]);
builder.build().expect("yaml type must be valid")
}
#[cfg(test)]
mod test {
use super::*;
use ast_grep_core::{source::TSParseError, Matcher, Pattern};
pub fn test_match_lang(query: &str, source: &str, lang: impl Language) {
let cand = lang.ast_grep(source);
let pattern = Pattern::str(query, lang);
assert!(
pattern.find_node(cand.root()).is_some(),
"goal: {pattern:?}, candidate: {}",
cand.root().to_sexp(),
);
}
pub fn test_non_match_lang(query: &str, source: &str, lang: impl Language) {
let cand = lang.ast_grep(source);
let pattern = Pattern::str(query, lang);
assert!(
pattern.find_node(cand.root()).is_none(),
"goal: {pattern:?}, candidate: {}",
cand.root().to_sexp(),
);
}
pub fn test_replace_lang(
src: &str,
pattern: &str,
replacer: &str,
lang: impl Language,
) -> Result<String, TSParseError> {
let mut source = lang.ast_grep(src);
let replacer = lang.pre_process_pattern(replacer);
let replacer = lang.ast_grep(replacer).inner;
assert!(source.replace(pattern, replacer)?);
Ok(source.generate())
}
#[test]
fn test_js_string() {
test_match_lang("'a'", "'a'", JavaScript);
test_match_lang("\"\"", "\"\"", JavaScript);
test_match_lang("''", "''", JavaScript);
}
#[test]
fn test_guess_by_extension() {
let path = Path::new("foo.rs");
assert_eq!(from_extension(path), Some(SupportLang::Rust));
}
}