use crate::parser::language::{
Export, Import, LanguageSupport, ParseResult, Symbol, SymbolKind, Visibility,
};
use tree_sitter::Language as TsLanguage;
pub struct JavaLanguage;
impl JavaLanguage {
fn node_text<'a>(node: &tree_sitter::Node, source: &'a [u8]) -> &'a str {
node.utf8_text(source).unwrap_or("")
}
fn first_line(node: &tree_sitter::Node, source: &[u8]) -> String {
let text = Self::node_text(node, source);
text.lines().next().unwrap_or("").trim().to_string()
}
fn extract_name(node: &tree_sitter::Node, source: &[u8]) -> String {
let mut cursor = node.walk();
for child in node.children(&mut cursor) {
if child.kind() == "identifier" {
return Self::node_text(&child, source).to_string();
}
}
String::new()
}
fn extract_visibility(node: &tree_sitter::Node, source: &[u8]) -> Visibility {
let mut cursor = node.walk();
for child in node.children(&mut cursor) {
if child.kind() == "modifiers" {
let text = Self::node_text(&child, source);
if text.contains("public") {
return Visibility::Public;
}
return Visibility::Private;
}
}
Visibility::Private
}
fn extract_fn_signature(node: &tree_sitter::Node, source: &[u8]) -> String {
let full_text = Self::node_text(node, source);
let mut cursor = node.walk();
for child in node.children(&mut cursor) {
if child.kind() == "block" {
let body_start = child.start_byte() - node.start_byte();
return full_text[..body_start].trim().to_string();
}
}
full_text.lines().next().unwrap_or("").trim().to_string()
}
fn extract_fn_body(node: &tree_sitter::Node, source: &[u8]) -> String {
let mut cursor = node.walk();
for child in node.children(&mut cursor) {
if child.kind() == "block" {
let text = &source[child.start_byte()..child.end_byte()];
return String::from_utf8_lossy(text).into_owned();
}
}
String::new()
}
fn extract_import(node: &tree_sitter::Node, source: &[u8]) -> Option<Import> {
let text = Self::node_text(node, source);
let inner = text
.trim_start_matches("import")
.trim()
.trim_start_matches("static")
.trim()
.trim_end_matches(';')
.trim();
if inner.is_empty() {
return None;
}
if inner.ends_with(".*") {
let source_path = inner.trim_end_matches(".*").to_string();
return Some(Import {
source: source_path,
names: vec!["*".to_string()],
});
}
if let Some(sep) = inner.rfind('.') {
let source_path = inner[..sep].to_string();
let name = inner[sep + 1..].to_string();
Some(Import {
source: source_path,
names: vec![name],
})
} else {
Some(Import {
source: String::new(),
names: vec![inner.to_string()],
})
}
}
}
impl LanguageSupport for JavaLanguage {
fn ts_language(&self) -> TsLanguage {
tree_sitter_java::LANGUAGE.into()
}
fn name(&self) -> &str {
"java"
}
fn extract(&self, source: &str, tree: &tree_sitter::Tree) -> ParseResult {
let source_bytes = source.as_bytes();
let root = tree.root_node();
let mut symbols: Vec<Symbol> = Vec::new();
let mut imports: Vec<Import> = Vec::new();
let mut exports: Vec<Export> = Vec::new();
let mut stack: Vec<tree_sitter::Node> = root.children(&mut root.walk()).collect();
while let Some(node) = stack.pop() {
match node.kind() {
"import_declaration" => {
if let Some(import) = Self::extract_import(&node, source_bytes) {
imports.push(import);
}
}
"class_declaration" => {
let name = Self::extract_name(&node, source_bytes);
let visibility = Self::extract_visibility(&node, source_bytes);
let is_pub = visibility == Visibility::Public;
let signature = Self::first_line(&node, source_bytes);
let body = Self::node_text(&node, source_bytes).to_string();
let start_line = node.start_position().row + 1;
let end_line = node.end_position().row + 1;
if is_pub {
exports.push(Export {
name: name.clone(),
kind: SymbolKind::Class,
});
}
symbols.push(Symbol {
name,
kind: SymbolKind::Class,
visibility,
signature,
body,
start_line,
end_line,
});
let mut cursor = node.walk();
for child in node.children(&mut cursor) {
stack.push(child);
}
}
"interface_declaration" => {
let name = Self::extract_name(&node, source_bytes);
let visibility = Self::extract_visibility(&node, source_bytes);
let is_pub = visibility == Visibility::Public;
let signature = Self::first_line(&node, source_bytes);
let body = Self::node_text(&node, source_bytes).to_string();
let start_line = node.start_position().row + 1;
let end_line = node.end_position().row + 1;
if is_pub {
exports.push(Export {
name: name.clone(),
kind: SymbolKind::Interface,
});
}
symbols.push(Symbol {
name,
kind: SymbolKind::Interface,
visibility,
signature,
body,
start_line,
end_line,
});
}
"enum_declaration" => {
let name = Self::extract_name(&node, source_bytes);
let visibility = Self::extract_visibility(&node, source_bytes);
let is_pub = visibility == Visibility::Public;
let signature = Self::first_line(&node, source_bytes);
let body = Self::node_text(&node, source_bytes).to_string();
let start_line = node.start_position().row + 1;
let end_line = node.end_position().row + 1;
if is_pub {
exports.push(Export {
name: name.clone(),
kind: SymbolKind::Enum,
});
}
symbols.push(Symbol {
name,
kind: SymbolKind::Enum,
visibility,
signature,
body,
start_line,
end_line,
});
}
"method_declaration" => {
let name = Self::extract_name(&node, source_bytes);
let visibility = Self::extract_visibility(&node, source_bytes);
let is_pub = visibility == Visibility::Public;
let signature = Self::extract_fn_signature(&node, source_bytes);
let body = Self::extract_fn_body(&node, source_bytes);
let start_line = node.start_position().row + 1;
let end_line = node.end_position().row + 1;
if is_pub {
exports.push(Export {
name: name.clone(),
kind: SymbolKind::Method,
});
}
symbols.push(Symbol {
name,
kind: SymbolKind::Method,
visibility,
signature,
body,
start_line,
end_line,
});
}
"constructor_declaration" => {
let name = Self::extract_name(&node, source_bytes);
let visibility = Self::extract_visibility(&node, source_bytes);
let is_pub = visibility == Visibility::Public;
let signature = Self::extract_fn_signature(&node, source_bytes);
let body = Self::extract_fn_body(&node, source_bytes);
let start_line = node.start_position().row + 1;
let end_line = node.end_position().row + 1;
if is_pub {
exports.push(Export {
name: name.clone(),
kind: SymbolKind::Method,
});
}
symbols.push(Symbol {
name,
kind: SymbolKind::Method,
visibility,
signature,
body,
start_line,
end_line,
});
}
"class_body" | "interface_body" | "enum_body" => {
let mut cursor = node.walk();
for child in node.children(&mut cursor) {
stack.push(child);
}
}
_ => {}
}
}
ParseResult {
symbols,
imports,
exports,
}
}
}
#[cfg(test)]
mod tests {
use super::*;
use crate::parser::language::{SymbolKind, Visibility};
fn make_parser() -> tree_sitter::Parser {
let mut parser = tree_sitter::Parser::new();
parser
.set_language(&tree_sitter_java::LANGUAGE.into())
.expect("failed to set language");
parser
}
#[test]
fn test_extract_public_class() {
let source = r#"public class HelloWorld {
public void greet() {
System.out.println("Hello");
}
}
"#;
let mut parser = make_parser();
let tree = parser.parse(source, None).expect("parse failed");
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
let classes: Vec<_> = result
.symbols
.iter()
.filter(|s| s.kind == SymbolKind::Class)
.collect();
assert!(!classes.is_empty(), "expected class symbol");
assert_eq!(classes[0].name, "HelloWorld");
assert_eq!(classes[0].visibility, Visibility::Public);
let exported: Vec<_> = result
.exports
.iter()
.filter(|e| e.name == "HelloWorld")
.collect();
assert!(!exported.is_empty(), "HelloWorld should be exported");
}
#[test]
fn test_extract_import() {
let source = r#"import java.util.List;
import java.util.HashMap;
"#;
let mut parser = make_parser();
let tree = parser.parse(source, None).expect("parse failed");
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
assert_eq!(result.imports.len(), 2);
let names: Vec<&str> = result
.imports
.iter()
.flat_map(|i| i.names.iter().map(|n| n.as_str()))
.collect();
assert!(
names.contains(&"List"),
"expected List import, got: {:?}",
names
);
assert!(
names.contains(&"HashMap"),
"expected HashMap import, got: {:?}",
names
);
}
#[test]
fn test_extract_method_visibility() {
let source = r#"public class Foo {
public void publicMethod() {}
private void privateMethod() {}
}
"#;
let mut parser = make_parser();
let tree = parser.parse(source, None).expect("parse failed");
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
let methods: Vec<_> = result
.symbols
.iter()
.filter(|s| s.kind == SymbolKind::Method)
.collect();
assert_eq!(methods.len(), 2);
let pub_method = methods
.iter()
.find(|m| m.name == "publicMethod")
.expect("publicMethod not found");
assert_eq!(pub_method.visibility, Visibility::Public);
let priv_method = methods
.iter()
.find(|m| m.name == "privateMethod")
.expect("privateMethod not found");
assert_eq!(priv_method.visibility, Visibility::Private);
}
#[test]
fn test_extract_interface() {
let source = "public interface Runnable {\n void run();\n}\n";
let mut parser = make_parser();
let tree = parser.parse(source, None).unwrap();
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
let interfaces: Vec<_> = result
.symbols
.iter()
.filter(|s| s.kind == SymbolKind::Interface)
.collect();
assert!(!interfaces.is_empty(), "expected interface symbol");
assert_eq!(interfaces[0].name, "Runnable");
assert_eq!(interfaces[0].visibility, Visibility::Public);
}
#[test]
fn test_extract_enum() {
let source = "public enum Status {\n ACTIVE,\n INACTIVE\n}\n";
let mut parser = make_parser();
let tree = parser.parse(source, None).unwrap();
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
let enums: Vec<_> = result
.symbols
.iter()
.filter(|s| s.kind == SymbolKind::Enum)
.collect();
assert!(!enums.is_empty(), "expected enum symbol");
assert_eq!(enums[0].name, "Status");
assert_eq!(enums[0].visibility, Visibility::Public);
}
#[test]
fn test_extract_constructor() {
let source = "public class Foo {\n public Foo(int x) {\n this.x = x;\n }\n}\n";
let mut parser = make_parser();
let tree = parser.parse(source, None).unwrap();
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
let constructors: Vec<_> = result
.symbols
.iter()
.filter(|s| s.kind == SymbolKind::Method && s.name == "Foo")
.collect();
assert!(!constructors.is_empty(), "expected constructor");
}
#[test]
fn test_extract_inner_class() {
let source = "public class Outer {\n public class Inner {\n public void doWork() {}\n }\n}\n";
let mut parser = make_parser();
let tree = parser.parse(source, None).unwrap();
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
let classes: Vec<_> = result
.symbols
.iter()
.filter(|s| s.kind == SymbolKind::Class)
.collect();
assert!(classes.len() >= 2, "expected Outer and Inner classes");
}
#[test]
fn test_extract_wildcard_import() {
let source = "import java.util.*;\n";
let mut parser = make_parser();
let tree = parser.parse(source, None).unwrap();
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
assert_eq!(result.imports.len(), 1);
assert!(result.imports[0].names.contains(&"*".to_string()));
assert_eq!(result.imports[0].source, "java.util");
}
#[test]
fn test_extract_abstract_class() {
let source = "public abstract class Shape {\n public abstract double area();\n}\n";
let mut parser = make_parser();
let tree = parser.parse(source, None).unwrap();
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
let classes: Vec<_> = result
.symbols
.iter()
.filter(|s| s.kind == SymbolKind::Class)
.collect();
assert!(!classes.is_empty());
assert_eq!(classes[0].name, "Shape");
assert_eq!(classes[0].visibility, Visibility::Public);
}
#[test]
fn test_extract_private_class() {
let source = "class PackagePrivate {\n void method() {}\n}\n";
let mut parser = make_parser();
let tree = parser.parse(source, None).unwrap();
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
let classes: Vec<_> = result
.symbols
.iter()
.filter(|s| s.kind == SymbolKind::Class)
.collect();
assert!(!classes.is_empty());
assert_eq!(classes[0].visibility, Visibility::Private);
assert!(result.exports.iter().all(|e| e.name != "PackagePrivate"));
}
#[test]
fn test_empty_source() {
let source = "";
let mut parser = make_parser();
let tree = parser.parse(source, None).unwrap();
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
assert!(result.symbols.is_empty());
assert!(result.imports.is_empty());
assert!(result.exports.is_empty());
}
#[test]
fn test_extract_static_method() {
let source = "public class App {\n public static void main(String[] args) {}\n}\n";
let mut parser = make_parser();
let tree = parser.parse(source, None).unwrap();
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
let methods: Vec<_> = result
.symbols
.iter()
.filter(|s| s.kind == SymbolKind::Method && s.name == "main")
.collect();
assert!(!methods.is_empty(), "expected main method");
assert_eq!(methods[0].visibility, Visibility::Public);
}
#[test]
fn test_interface_method_no_body() {
let source = "public interface Comparable {\n int compareTo(Object o);\n}\n";
let mut parser = make_parser();
let tree = parser.parse(source, None).unwrap();
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
let _ = result;
}
#[test]
fn test_abstract_method() {
let source = "public abstract class Shape {\n public abstract double area();\n}\n";
let mut parser = make_parser();
let tree = parser.parse(source, None).unwrap();
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
let _ = result;
}
#[test]
fn test_extract_name_fallback() {
let source = "public class App {\n static {}\n}\n";
let mut parser = make_parser();
let tree = parser.parse(source, None).unwrap();
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
let _ = result;
}
#[test]
fn test_wildcard_import() {
let source = "import java.util.*;\n";
let mut parser = make_parser();
let tree = parser.parse(source, None).unwrap();
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
if !result.imports.is_empty() {
assert!(result.imports[0].names.contains(&"*".to_string()));
}
}
#[test]
fn test_bare_import_no_package() {
let source = "import Foo;\n";
let mut parser = make_parser();
let tree = parser.parse(source, None).unwrap();
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
if !result.imports.is_empty() {
assert!(result.imports[0].source.is_empty());
assert!(result.imports[0].names.contains(&"Foo".to_string()));
}
}
#[test]
fn test_package_private_class() {
let source = "class Internal {\n void helper() {}\n}\n";
let mut parser = make_parser();
let tree = parser.parse(source, None).unwrap();
let lang = JavaLanguage;
let result = lang.extract(source, &tree);
let classes: Vec<_> = result
.symbols
.iter()
.filter(|s| s.kind == SymbolKind::Class)
.collect();
assert!(!classes.is_empty());
assert_eq!(classes[0].visibility, Visibility::Private);
}
}