use super::CParser;
use crate::io::format::format_utc_timestamp;
use crate::parsing::NodeTracker;
use crate::types::FileId;
use std::collections::{HashMap, HashSet};
use thiserror::Error;
use tree_sitter::Parser;
#[derive(Error, Debug)]
pub enum AuditError {
#[error("Failed to read file: {0}")]
FileRead(#[from] std::io::Error),
#[error("Failed to set language: {0}")]
LanguageSetup(String),
#[error("Failed to parse code")]
ParseFailure,
#[error("Failed to create parser: {0}")]
ParserCreation(String),
}
pub struct CParserAudit {
pub grammar_nodes: HashMap<String, u16>,
pub implemented_nodes: HashSet<String>,
pub extracted_symbol_kinds: HashSet<String>,
}
impl CParserAudit {
pub fn audit_file(file_path: &str) -> Result<Self, AuditError> {
let code = std::fs::read_to_string(file_path)?;
Self::audit_code(&code)
}
pub fn audit_code(code: &str) -> Result<Self, AuditError> {
let mut parser = Parser::new();
let language = tree_sitter_c::LANGUAGE.into();
parser
.set_language(&language)
.map_err(|e| AuditError::LanguageSetup(e.to_string()))?;
let tree = parser.parse(code, None).ok_or(AuditError::ParseFailure)?;
let mut grammar_nodes = HashMap::new();
discover_nodes(tree.root_node(), &mut grammar_nodes);
let mut c_parser = CParser::new().map_err(|e| AuditError::ParserCreation(e.to_string()))?;
let mut symbol_counter = crate::types::SymbolCounter::new();
let file_id = FileId::new(1).unwrap();
let symbols = c_parser.parse(code, file_id, &mut symbol_counter);
let mut extracted_symbol_kinds = HashSet::new();
for symbol in &symbols {
extracted_symbol_kinds.insert(format!("{:?}", symbol.kind));
}
let implemented_nodes: HashSet<String> = c_parser
.get_handled_nodes()
.iter()
.map(|handled_node| handled_node.name.clone())
.collect();
Ok(CParserAudit {
grammar_nodes,
implemented_nodes,
extracted_symbol_kinds,
})
}
pub fn coverage_percentage(&self) -> f64 {
if self.grammar_nodes.is_empty() {
return 0.0;
}
let total = self.grammar_nodes.len();
let implemented = self.implemented_nodes.len();
(implemented as f64 / total as f64) * 100.0
}
pub fn generate_report(&self) -> String {
let mut report = String::new();
report.push_str("# C Parser Coverage Report\n\n");
report.push_str(&format!("*Generated: {}*\n\n", format_utc_timestamp()));
let key_nodes = vec![
"translation_unit",
"function_definition",
"declaration",
"struct_specifier",
"union_specifier",
"enum_specifier",
"typedef_declaration",
"init_declarator",
"parameter_declaration",
"field_declaration",
"enumerator",
"macro_definition",
"preproc_include",
"compound_statement",
"if_statement",
"while_statement",
"for_statement",
"do_statement",
"switch_statement",
"case_statement",
"expression_statement",
];
let key_implemented = key_nodes
.iter()
.filter(|n| self.implemented_nodes.contains(**n))
.count();
report.push_str("## Summary\n");
report.push_str(&format!(
"- Key nodes: {}/{} ({}%)\n",
key_implemented,
key_nodes.len(),
(key_implemented * 100) / key_nodes.len()
));
report.push_str(&format!(
"- Symbol kinds extracted: {}\n",
self.extracted_symbol_kinds.len()
));
report.push_str(
"\n> **Note:** Key nodes are symbol-producing constructs (functions, structs, typedefs).\n\n",
);
report.push_str("## Coverage Table\n\n");
report.push_str("| Node Type | ID | Status |\n");
report.push_str("|-----------|-----|--------|\n");
let mut gaps = Vec::new();
let mut missing = Vec::new();
for node_name in &key_nodes {
let status = if let Some(id) = self.grammar_nodes.get(*node_name) {
if self.implemented_nodes.contains(*node_name) {
format!("{id} | ✅ implemented")
} else {
gaps.push(node_name);
format!("{id} | ⚠️ gap")
}
} else {
missing.push(node_name);
"- | ❌ not found".to_string()
};
report.push_str(&format!("| {node_name} | {status} |\n"));
}
report.push_str("\n## Legend\n\n");
report
.push_str("- ✅ **implemented**: Node type is recognized and handled by the parser\n");
report.push_str("- ⚠️ **gap**: Node type exists in the grammar but not handled by parser (needs implementation)\n");
report.push_str("- ❌ **not found**: Node type not present in the example file (may need better examples)\n");
report.push_str("\n## Recommended Actions\n\n");
if !gaps.is_empty() {
report.push_str("### Priority 1: Implementation Gaps\n");
report.push_str("These nodes exist in your code but aren't being captured:\n\n");
for gap in &gaps {
report.push_str(&format!("- `{gap}`: Add parsing logic in parser.rs\n"));
}
report.push('\n');
}
if !missing.is_empty() {
report.push_str("### Priority 2: Missing Examples\n");
report.push_str("These nodes aren't in the comprehensive example. Consider:\n\n");
for node in &missing {
report.push_str(&format!(
"- `{node}`: Add example to comprehensive.c or verify node name\n"
));
}
report.push('\n');
}
if gaps.is_empty() && missing.is_empty() {
report.push_str("✨ **Excellent coverage!** All key nodes are implemented.\n");
}
report
}
}
fn discover_nodes(node: tree_sitter::Node, registry: &mut HashMap<String, u16>) {
registry.insert(node.kind().to_string(), node.kind_id());
let mut cursor = node.walk();
for child in node.children(&mut cursor) {
discover_nodes(child, registry);
}
}