use std::process::Command;
pub fn validate_structural(code: &str, backend_name: &str) -> Vec<String> {
match backend_name {
"python-psycopg3" | "python-asyncpg" | "python-aiomysql" | "python-aiosqlite" => {
validate_python(code)
}
"typescript-postgres"
| "typescript-pg"
| "typescript-mysql2"
| "typescript-better-sqlite3" => validate_typescript(code),
"go-pgx" => validate_go(code),
"java-jdbc" => validate_java(code),
"kotlin-jdbc" => validate_kotlin(code),
"csharp-npgsql" => validate_csharp(code),
"elixir-postgrex" | "elixir-ecto" => validate_elixir(code),
"ruby-pg" | "ruby-mysql2" | "ruby-sqlite3" | "ruby-trilogy" => validate_ruby(code),
"php-pdo" | "php-amphp" => validate_php(code),
"rust-sqlx" | "rust-tokio-postgres" => vec![],
_ => vec![format!("unknown backend: {}", backend_name)],
}
}
fn validate_python(code: &str) -> Vec<String> {
let mut errors = Vec::new();
if code.contains("from __future__ import annotations") {
errors.push(
"unnecessary `from __future__ import annotations` — target is Python 3.10+".into(),
);
}
let has_struct = code.contains("@dataclass")
|| code.contains("(BaseModel)")
|| code.contains("(msgspec.Struct)")
|| code.contains("class ");
if !has_struct {
if !code.contains("async def ") && !code.contains("def ") {
errors.push("missing `@dataclass`/`class` and `def ` -- no meaningful output".into());
}
}
if !code.contains("async def ") && !code.contains("def ") {
errors.push("missing `async def ` or `def ` (for query functions)".into());
}
if code.contains("from typing import Union") {
errors.push("contains `from typing import Union` (pre-3.10 style)".into());
}
if code.contains("from typing import Optional") {
errors.push("contains `from typing import Optional` (pre-3.10 style)".into());
}
if code.contains("List[") {
errors.push("contains `List[` (use lowercase `list[`)".into());
}
if code.contains("Dict[") {
errors.push("contains `Dict[` (use lowercase `dict[`)".into());
}
for (i, line) in code.lines().enumerate() {
if line.starts_with('\t') {
errors.push(format!(
"line {} uses tab indentation (should use 4 spaces)",
i + 1
));
break; }
}
errors
}
fn validate_typescript(code: &str) -> Vec<String> {
let mut errors = Vec::new();
let has_function = code.contains("export async function") || code.contains("export function");
let has_zod = code.contains("z.object(") || code.contains("z.infer<");
if !code.contains("export interface")
&& !code.contains("export type")
&& !has_zod
&& !has_function
{
errors.push("missing `export interface` or `export type` (for DTOs)".into());
}
if !has_function {
errors.push("missing `export async function` or `export function`".into());
}
for line in code.lines() {
let trimmed = line.trim();
if trimmed.contains(": any")
|| trimmed.contains("<any>")
|| trimmed.contains("any;")
|| trimmed.contains("any,")
|| trimmed.contains("any)")
{
errors.push(format!(
"contains `any` type (should use `unknown` or specific): {}",
trimmed
));
break;
}
}
errors
}
fn validate_go(code: &str) -> Vec<String> {
let mut errors = Vec::new();
let has_func = code.contains("func ");
let has_struct = code.contains("type ") && code.contains("struct {");
if !has_struct && !has_func {
errors.push("missing `type ... struct {` (for structs)".into());
}
if !has_func {
errors.push("missing `func ` (for functions)".into());
}
if !code.contains("context.Context") {
errors.push("missing `context.Context` as first param".into());
}
let has_indented_lines = code
.lines()
.any(|l| l.starts_with('\t') || l.starts_with(" "));
if has_indented_lines {
let uses_spaces = code
.lines()
.any(|l| l.starts_with(" ") && !l.trim().is_empty());
if uses_spaces {
errors.push("uses space indentation (Go standard is tabs)".into());
}
}
if has_struct && !code.contains("json:\"") {
errors.push("missing `json:\"` tags on struct fields".into());
}
errors
}
fn validate_java(code: &str) -> Vec<String> {
let mut errors = Vec::new();
let has_static = code.contains("public static ");
if !code.contains("public record ") && !has_static {
errors.push("missing `public record ` (for DTOs)".into());
}
if !has_static {
errors.push("missing `public static ` (for query methods)".into());
}
if !code.contains("throws SQLException") {
errors.push("missing `throws SQLException`".into());
}
if !code.contains("try (") {
errors.push("missing `try (` (try-with-resources)".into());
}
errors
}
fn validate_kotlin(code: &str) -> Vec<String> {
let mut errors = Vec::new();
let has_fun = code.contains("fun ");
if !code.contains("data class ") && !has_fun {
errors.push("missing `data class ` (for DTOs)".into());
}
if !has_fun {
errors.push("missing `fun ` (for functions)".into());
}
if !code.contains(".use {") {
errors.push("missing `.use {` (resource management)".into());
}
errors
}
fn validate_csharp(code: &str) -> Vec<String> {
let mut errors = Vec::new();
let has_async = code.contains("async Task<") || code.contains("async Task ");
if !code.contains("public record ") && !has_async {
errors.push("missing `public record ` (for DTOs)".into());
}
if !has_async {
errors.push("missing `async Task<` or `async Task` (for async methods)".into());
}
if !code.contains("await ") {
errors.push("missing `await `".into());
}
errors
}
fn validate_elixir(code: &str) -> Vec<String> {
let mut errors = Vec::new();
let has_def = code.contains("def ") || code.contains("defp ");
if !code.contains("defmodule ") && !has_def {
errors.push("missing `defmodule ` (for modules)".into());
}
if !code.contains("defstruct") && !has_def {
errors.push("missing `defstruct` (for structs)".into());
}
if !has_def {
errors.push("missing `def ` or `defp ` (for functions)".into());
}
if !code.contains("@type ") && !code.contains("@spec ") {
errors.push("missing `@type ` or `@spec ` (for typespecs)".into());
}
errors
}
fn validate_ruby(code: &str) -> Vec<String> {
let mut errors = Vec::new();
let has_method = code.contains("def self.");
if !code.contains("Data.define") && !has_method {
errors.push("missing `Data.define` (for DTOs)".into());
}
if !has_method {
errors.push("missing `def self.` (for module methods)".into());
}
if !code.contains("# frozen_string_literal: true") {
errors.push("missing `# frozen_string_literal: true`".into());
}
if !code.contains("module Queries") {
errors.push("missing `module Queries` wrapper".into());
}
errors
}
fn validate_php(code: &str) -> Vec<String> {
let mut errors = Vec::new();
let has_function = code.contains("function ");
if !code.contains("readonly class ") && !has_function {
errors.push("missing `readonly class ` (for DTOs)".into());
}
if !has_function {
errors.push("missing `function ` (for query functions)".into());
}
if !code.contains("declare(strict_types=1)") {
errors.push("missing `declare(strict_types=1)`".into());
}
if !code.contains("<?php") {
errors.push("missing `<?php`".into());
}
errors
}
pub fn validate_with_tools(code: &str, backend_name: &str) -> Option<Vec<String>> {
match backend_name {
name if name.starts_with("python") => validate_python_tools(code),
name if name.starts_with("typescript") => validate_typescript_tools(code),
name if name.starts_with("go") => validate_go_tools(code),
name if name.starts_with("ruby") => validate_ruby_tools(code),
name if name.starts_with("php") => validate_php_tools(code),
name if name.starts_with("kotlin") => validate_kotlin_tools(code),
_ => None,
}
}
fn write_temp(code: &str, ext: &str) -> Option<std::path::PathBuf> {
use std::sync::atomic::{AtomicU64, Ordering};
static COUNTER: AtomicU64 = AtomicU64::new(0);
let n = COUNTER.fetch_add(1, Ordering::Relaxed);
let basename = if ext == ".kt" {
format!("ScytheValidate{n}")
} else {
format!("scythe_validate_{n}")
};
let path = std::env::temp_dir().join(format!("{basename}{ext}"));
let trimmed = format!("{}\n", code.trim_end());
std::fs::write(&path, trimmed).ok()?;
Some(path)
}
fn validate_python_tools(code: &str) -> Option<Vec<String>> {
if Command::new("python3").arg("--version").output().is_err() {
return None;
}
let path = write_temp(code, ".py")?;
let mut errors = vec![];
let out = Command::new("python3")
.args([
"-c",
&format!("import ast; ast.parse(open({:?}).read())", path),
])
.output()
.ok()?;
if !out.status.success() {
errors.push(format!(
"python syntax: {}",
String::from_utf8_lossy(&out.stderr)
.lines()
.next()
.unwrap_or("")
));
}
if Command::new("ruff").arg("--version").output().is_ok() {
let out = Command::new("ruff")
.args([
"check",
"--select",
"E,F,I",
"--target-version",
"py310",
path.to_str()?,
])
.output()
.ok()?;
if !out.status.success() {
for line in String::from_utf8_lossy(&out.stdout).lines().take(3) {
if !line.trim().is_empty() {
errors.push(format!("ruff: {line}"));
}
}
}
}
let _ = std::fs::remove_file(&path);
Some(errors)
}
fn validate_typescript_tools(code: &str) -> Option<Vec<String>> {
if Command::new("biome").arg("--version").output().is_err() {
return None;
}
let path = write_temp(code, ".ts")?;
let mut errors = vec![];
let out = Command::new("biome")
.args(["check", "--no-errors-on-unmatched", path.to_str()?])
.output()
.ok()?;
if !out.status.success() {
for line in String::from_utf8_lossy(&out.stderr).lines().take(3) {
if !line.trim().is_empty() {
errors.push(format!("biome: {line}"));
}
}
}
let _ = std::fs::remove_file(&path);
Some(errors)
}
fn validate_go_tools(code: &str) -> Option<Vec<String>> {
if Command::new("gofmt").arg("-h").output().is_err() {
return None;
}
let path = write_temp(code, ".go")?;
let mut errors = vec![];
let out = Command::new("gofmt")
.args(["-e", path.to_str()?])
.output()
.ok()?;
if !out.status.success() {
for line in String::from_utf8_lossy(&out.stderr).lines().take(3) {
if !line.trim().is_empty() {
errors.push(format!("gofmt: {line}"));
}
}
}
let _ = std::fs::remove_file(&path);
Some(errors)
}
fn validate_ruby_tools(code: &str) -> Option<Vec<String>> {
if Command::new("ruby").arg("--version").output().is_err() {
return None;
}
let path = write_temp(code, ".rb")?;
let mut errors = vec![];
let out = Command::new("ruby")
.args(["-c", path.to_str()?])
.output()
.ok()?;
if !out.status.success() {
errors.push(format!(
"ruby syntax: {}",
String::from_utf8_lossy(&out.stderr)
.lines()
.next()
.unwrap_or("")
));
}
let _ = std::fs::remove_file(&path);
Some(errors)
}
fn validate_php_tools(code: &str) -> Option<Vec<String>> {
if Command::new("php").arg("--version").output().is_err() {
return None;
}
let path = write_temp(code, ".php")?;
let mut errors = vec![];
let out = Command::new("php")
.args(["-l", path.to_str()?])
.output()
.ok()?;
if !out.status.success() {
errors.push(format!(
"php syntax: {}",
String::from_utf8_lossy(&out.stdout)
.lines()
.next()
.unwrap_or("")
));
}
let _ = std::fs::remove_file(&path);
Some(errors)
}
fn validate_kotlin_tools(code: &str) -> Option<Vec<String>> {
if Command::new("ktlint").arg("--version").output().is_err() {
return None;
}
let path = write_temp(code, ".kt")?;
let mut errors = vec![];
let out = Command::new("ktlint")
.args(["--log-level=error", path.to_str()?])
.output()
.ok()?;
if !out.status.success() {
for line in String::from_utf8_lossy(&out.stdout).lines().take(3) {
if !line.trim().is_empty() {
errors.push(format!("ktlint: {line}"));
}
}
}
let _ = std::fs::remove_file(&path);
Some(errors)
}
#[cfg(test)]
mod tests {
use super::*;
#[test]
fn test_unknown_backend() {
let errors = validate_structural("some code", "unknown-backend");
assert_eq!(errors.len(), 1);
assert!(errors[0].contains("unknown backend"));
}
#[test]
fn test_rust_backends_skip() {
assert!(validate_structural("anything", "rust-sqlx").is_empty());
assert!(validate_structural("anything", "rust-tokio-postgres").is_empty());
}
#[test]
fn test_python_valid() {
let code = r#"from dataclasses import dataclass
@dataclass
class ListUsersRow:
id: int
name: str
async def list_users(conn) -> list[ListUsersRow]:
pass
"#;
let errors = validate_structural(code, "python-psycopg3");
assert!(errors.is_empty(), "expected no errors, got: {:?}", errors);
}
#[test]
fn test_python_invalid_typing() {
let code = r#"from typing import Optional
@dataclass
class Row:
id: int
def query() -> List[Row]:
pass
"#;
let errors = validate_structural(code, "python-asyncpg");
assert!(errors.iter().any(|e| e.contains("Optional")));
assert!(errors.iter().any(|e| e.contains("List[")));
}
#[test]
fn test_typescript_valid() {
let code = r#"export interface ListUsersRow {
id: number;
name: string;
}
export async function listUsers(): Promise<ListUsersRow[]> {
// ...
}
"#;
let errors = validate_structural(code, "typescript-postgres");
assert!(errors.is_empty(), "expected no errors, got: {:?}", errors);
}
#[test]
fn test_go_valid() {
let code = "package db\n\nimport (\n\t\"context\"\n\t\"encoding/json\"\n)\n\ntype ListUsersRow struct {\n\tID int `json:\"id\"`\n\tName string `json:\"name\"`\n}\n\nfunc ListUsers(ctx context.Context) ([]ListUsersRow, error) {\n\treturn nil, nil\n}\n";
let errors = validate_structural(code, "go-pgx");
assert!(errors.is_empty(), "expected no errors, got: {:?}", errors);
}
#[test]
fn test_php_valid() {
let code = r#"<?php
declare(strict_types=1);
readonly class ListUsersRow {
public function __construct(
public int $id,
public string $name,
) {}
}
function listUsers($pdo): array {
return [];
}
"#;
let errors = validate_structural(code, "php-pdo");
assert!(errors.is_empty(), "expected no errors, got: {:?}", errors);
}
}