perl_parser/lib.rs
1//! # perl-parser — Production-grade Perl parser and Language Server Protocol engine
2//!
3//! A comprehensive Perl parser built on recursive descent principles, providing robust AST
4//! generation, LSP feature providers, workspace indexing, and test-driven development support.
5//!
6//! ## Key Features
7//!
8//! - **Tree-sitter Compatible**: AST with kinds, fields, and position tracking compatible with tree-sitter grammar
9//! - **Comprehensive Parsing**: ~100% edge case coverage for Perl 5.8-5.40 syntax
10//! - **LSP Integration**: Full Language Server Protocol feature set (100% compliance, LSP 3.18)
11//! - **TDD Workflow**: Intelligent test generation with return value analysis
12//! - **Incremental Parsing**: Efficient re-parsing for real-time editing
13//! - **Error Recovery**: Graceful handling of malformed input with detailed diagnostics
14//! - **Workspace Navigation**: Cross-file symbol resolution and reference tracking
15//!
16//! ## Quick Start
17//!
18//! ### Basic Parsing
19//!
20//! ```rust
21//! use perl_parser::Parser;
22//!
23//! # fn main() -> Result<(), Box<dyn std::error::Error>> {
24//! let code = r#"sub hello { print "Hello, world!\n"; }"#;
25//! let mut parser = Parser::new(code);
26//!
27//! match parser.parse() {
28//! Ok(ast) => {
29//! println!("AST: {}", ast.to_sexp());
30//! println!("Parsed {} nodes", ast.count_nodes());
31//! }
32//! Err(e) => eprintln!("Parse error: {}", e),
33//! }
34//! # Ok(())
35//! # }
36//! ```
37//!
38//! ### Test-Driven Development
39//!
40//! Generate tests automatically from parsed code:
41//!
42//! ```rust
43//! use perl_parser::Parser;
44//! use perl_parser::tdd::test_generator::{TestGenerator, TestFramework};
45//!
46//! # fn main() -> Result<(), Box<dyn std::error::Error>> {
47//! let code = r#"sub add { my ($a, $b) = @_; return $a + $b; }"#;
48//! let mut parser = Parser::new(code);
49//! let ast = parser.parse()?;
50//!
51//! let generator = TestGenerator::new(TestFramework::TestMore);
52//! let tests = generator.generate_tests(&ast, code);
53//!
54//! // Returns test cases with intelligent assertions
55//! assert!(!tests.is_empty());
56//! # Ok(())
57//! # }
58//! ```
59//!
60//! ### LSP Integration
61//!
//! Use as a library for LSP features (see `perllsp` for the standalone server):
63//!
64//! ```rust
65//! use perl_parser::Parser;
66//! use perl_parser::analysis::semantic::SemanticAnalyzer;
67//!
68//! # fn main() -> Result<(), Box<dyn std::error::Error>> {
69//! let code = "my $x = 42;";
70//! let mut parser = Parser::new(code);
71//! let ast = parser.parse()?;
72//!
73//! // Semantic analysis for hover, completion, etc.
74//! let model = SemanticAnalyzer::analyze(&ast);
75//! # Ok(())
76//! # }
77//! ```
78//!
79//! ## Architecture
80//!
81//! The parser is organized into distinct layers for maintainability and testability:
82//!
83//! ### Core Engine ([`engine`])
84//!
85//! - **[`parser`]**: Recursive descent parser with operator precedence
86//! - **[`ast`]**: Abstract Syntax Tree definitions and node types
87//! - **[`error`]**: Error classification, recovery strategies, and diagnostics
88//! - **[`position`]**: UTF-16 position mapping for LSP protocol compliance
89//! - **[`quote_parser`]**: Specialized parser for quote-like operators
90//! - **[`heredoc_collector`]**: FIFO heredoc collection with indent stripping
91//!
92//! ### IDE Integration (LSP Provider Crates)
93//!
94//! LSP provider modules were removed from `perl-parser` as part of #4414 (microcrate
95//! collapse, PR #0). Import directly from the provider crates:
96//!
97//! - `perl_lsp_completion` — context-aware completion providers
98//! - `perl_lsp_diagnostics` — diagnostics generation and formatting
99//! - `perl_lsp_navigation` — references, document links, type definitions, workspace symbols
100//! - `perl_lsp_rename` — rename providers with validation
101//! - `perl_lsp_semantic_tokens` — semantic token generation
102//! - `perl_lsp_inlay_hints` — inlay hint providers
103//! - `perl_lsp_code_actions` — code action providers
104//!
105//! ### Analysis ([`analysis`])
106//!
107//! - **[`scope_analyzer`]**: Variable and subroutine scoping resolution
108//! - **[`type_inference`]**: Perl type inference engine
109//! - **[`semantic`]**: Semantic model with hover information
110//! - **[`symbol`]**: Symbol table and reference tracking
111//! - **[`dead_code_detector`]**: Unused code detection
112//!
113//! ### Workspace ([`workspace`])
114//!
115//! - **[`workspace_index`]**: Cross-file symbol indexing
116//! - **[`workspace_rename`]**: Multi-file refactoring
117//! - **[`document_store`]**: Document state management
118//!
119//! ### Refactoring ([`refactor`])
120//!
121//! - **[`refactoring`]**: Unified refactoring engine
122//! - **[`modernize`]**: Code modernization utilities
123//! - **[`import_optimizer`]**: Import statement analysis and optimization
124//!
125//! ### Test Support ([`tdd`])
126//!
127//! - **[`test_generator`]**: Intelligent test case generation
128//! - **[`test_runner`]**: Test execution and validation
129//! - **`tdd_workflow`** *(test-only)*: TDD cycle management and coverage tracking
130//!
131//! ## LSP Feature Support
132//!
133//! This crate provides the engine for LSP features. The public standalone server is in
134//! `perllsp`, backed by the `perl-lsp-rs` implementation crate.
135//!
136//! ### Implemented Features
137//!
138//! - **Completion**: Context-aware code completion with type inference
139//! - **Hover**: Documentation and type information on hover
140//! - **Definition**: Go-to-definition with cross-file support
141//! - **References**: Find all references with workspace indexing
142//! - **Rename**: Symbol renaming with conflict detection
143//! - **Diagnostics**: Syntax errors and semantic warnings
144//! - **Formatting**: Code formatting via perltidy integration
145//! - **Folding**: Code folding for blocks and regions
146//! - **Semantic Tokens**: Fine-grained syntax highlighting
147//! - **Call Hierarchy**: Function call navigation
148//! - **Type Hierarchy**: Class inheritance navigation
149//!
150//! See `docs/reference/LSP_CAPABILITY_POLICY.md` for the complete capability matrix.
151//!
152//! ## Incremental Parsing
153//!
154//! Enable efficient re-parsing for real-time editing:
155//!
156//! ```rust,ignore
157//! use perl_parser::{IncrementalState, apply_edits, Edit};
158//!
159//! # fn main() -> Result<(), Box<dyn std::error::Error>> {
160//! let mut state = IncrementalState::new("my $x = 1;");
161//! let ast = state.parse()?;
162//!
163//! // Apply an edit
164//! let edit = Edit {
165//! start_byte: 3,
166//! old_end_byte: 5,
167//! new_end_byte: 5,
168//! text: "$y".to_string(),
169//! };
170//! apply_edits(&mut state, vec![edit]);
171//!
172//! // Incremental re-parse reuses unchanged nodes
173//! let new_ast = state.parse()?;
174//! # Ok(())
175//! # }
176//! ```
177//!
178//! ## Error Recovery
179//!
180//! The parser uses intelligent error recovery to continue parsing after errors:
181//!
182//! ```rust
183//! use perl_parser::Parser;
184//!
185//! let code = "sub broken { if ("; // Incomplete code
186//! let mut parser = Parser::new(code);
187//!
188//! // Parser recovers and builds partial AST
189//! let result = parser.parse();
190//! assert!(result.is_ok());
191//!
192//! // Check recorded errors
193//! let errors = parser.errors();
194//! assert!(!errors.is_empty());
195//! ```
196//!
197//! ## Workspace Indexing
198//!
199//! Build cross-file indexes for workspace-wide navigation:
200//!
201//! ```rust,ignore
202//! use perl_parser::workspace_index::WorkspaceIndex;
203//!
204//! let mut index = WorkspaceIndex::new();
205//! index.index_file("lib/Foo.pm", "package Foo; sub bar { }");
206//! index.index_file("lib/Baz.pm", "use Foo; Foo::bar();");
207//!
208//! // Find all references to Foo::bar
209//! let refs = index.find_references("Foo::bar");
210//! ```
211//!
212//! ## Testing with perl-corpus
213//!
214//! The parser is tested against the comprehensive `perl-corpus` test suite:
215//!
216//! ```bash
217//! # Run parser tests with full corpus coverage
218//! cargo test -p perl-parser
219//!
220//! # Run specific test category
221//! cargo test -p perl-parser --test regex_tests
222//!
223//! # Validate documentation examples
224//! cargo test --doc
225//! ```
226//!
227//! ## Command-Line Tools
228//!
229//! Build and install the LSP server binary:
230//!
231//! ```bash
232//! # Build LSP server
233//! cargo build -p perllsp --release
234//!
235//! # Install globally
236//! cargo install --path crates/perllsp
237//!
238//! # Run LSP server
239//! perllsp --stdio
240//!
241//! # Check server health
242//! perllsp --health
243//! ```
244//!
245//! ## Integration Examples
246//!
247//! ### VSCode Extension
248//!
249//! Configure the LSP server in VSCode settings:
250//!
251//! ```json
252//! {
253//! "perl.lsp.path": "/path/to/perllsp",
254//! "perl.lsp.args": ["--stdio"]
255//! }
256//! ```
257//!
258//! ### Neovim Integration
259//!
260//! ```lua
261//! require'lspconfig'.perl.setup{
262//! cmd = { "/path/to/perllsp", "--stdio" },
263//! }
264//! ```
265//!
266//! ## Performance Characteristics
267//!
268//! - **Single-pass parsing**: O(n) complexity for well-formed input
269//! - **UTF-16 mapping**: Fast bidirectional offset conversion for LSP
270//! - **Incremental updates**: Reuses unchanged AST nodes for efficiency
271//! - **Memory efficiency**: Streaming token processing with bounded lookahead
272//!
273//! ## Compatibility
274//!
275//! - **Perl Versions**: 5.8 through 5.40 (covers 99% of CPAN)
276//! - **LSP Protocol**: LSP 3.18 specification
277//! - **Tree-sitter**: Compatible AST format and position tracking
278//! - **UTF-16**: Full Unicode support with correct LSP position mapping
279//!
280//! ## Related Crates
281//!
282//! - `perllsp`: Public Cargo entry point for the standalone LSP server
283//! - `perl-lsp-rs`: Standalone LSP server runtime implementation (moved from this crate)
284//! - `perl-lexer`: Context-aware Perl tokenizer
285//! - `perl-corpus`: Comprehensive test corpus and generators
286//! - `perl-dap`: Debug Adapter Protocol implementation
287//!
288//! ## Documentation
289//!
290//! - **API Docs**: See module documentation below
291//! - **LSP Guide**: `docs/reference/LSP_IMPLEMENTATION_GUIDE.md`
292//! - **Capability Policy**: `docs/reference/LSP_CAPABILITY_POLICY.md`
293//! - **Commands**: `docs/reference/COMMANDS_REFERENCE.md`
294//! - **Current Status**: `docs/project/CURRENT_STATUS.md`
295
296#![deny(unsafe_code)]
297#![deny(unreachable_pub)] // prevent stray pub items from escaping
298#![warn(rust_2018_idioms)]
299// NOTE: missing_docs enabled with baseline enforcement (Issue #197)
300// Baseline enforced via ci/missing_docs_baseline.txt
301#![warn(missing_docs)]
302#![allow(
303 // Core allows for parser/lexer code
304 clippy::too_many_lines,
305 clippy::module_name_repetitions,
306 clippy::cast_possible_truncation,
307 clippy::cast_sign_loss,
308 clippy::cast_precision_loss,
309 clippy::cast_possible_wrap,
310 clippy::must_use_candidate,
311 clippy::missing_errors_doc,
312 clippy::missing_panics_doc,
313
314 // Parser-specific patterns that are fine
315 clippy::wildcard_imports,
316 clippy::enum_glob_use,
317 clippy::match_same_arms,
318 clippy::if_not_else,
319 clippy::struct_excessive_bools,
320 clippy::items_after_statements,
321 clippy::return_self_not_must_use,
322 clippy::unused_self,
323 clippy::collapsible_match,
324 clippy::collapsible_if,
325 clippy::only_used_in_recursion,
326 clippy::items_after_test_module,
327 clippy::while_let_loop,
328 clippy::single_range_in_vec_init,
329 clippy::arc_with_non_send_sync,
330 clippy::needless_range_loop,
331 clippy::result_large_err,
332 clippy::if_same_then_else,
333 clippy::should_implement_trait,
334 clippy::manual_flatten,
335
336 // String handling in parsers
337 clippy::needless_raw_string_hashes,
338 clippy::single_char_pattern,
339 clippy::uninlined_format_args
340)]
//! ## Parser Design
342//!
343//! The parser follows a recursive descent design with operator precedence handling,
344//! maintaining a clean separation from the lexing phase. This modular approach
345//! enables:
346//!
347//! - Independent testing of parsing logic
348//! - Easy integration with different lexer implementations
349//! - Clear error boundaries between lexing and parsing phases
350//! - Optimal performance through single-pass parsing
351//!
352//! ## Example
353//!
354//! ```rust
355//! use perl_parser::Parser;
356//!
357//! let code = "my $x = 42;";
358//! let mut parser = Parser::new(code);
359//!
360//! match parser.parse() {
361//! Ok(ast) => println!("AST: {}", ast.to_sexp()),
362//! Err(e) => eprintln!("Parse error: {}", e),
363//! }
364//! ```
365
366/// Parser engine components and supporting utilities.
367pub mod engine;
368/// Legacy module aliases for moved engine components.
369pub use engine::{error, parser, position};
370
371/// Recursive descent Perl parser with error recovery and AST generation.
372pub use core::{Node, NodeKind, ParseError, ParseOutput, ParseResult, Parser, SourceLocation};
373/// Abstract Syntax Tree (AST) definitions for Perl parsing.
374pub use engine::ast;
375/// Experimental second-generation AST (work in progress).
376pub use engine::ast_v2;
377/// Edit tracking for incremental parsing.
378pub use engine::edit;
379/// Heredoc content collector with FIFO ordering and indent stripping.
380pub use engine::heredoc_collector;
381/// Parser context with error recovery support.
382pub use engine::parser_context;
383/// Pragma tracking for `use` and related directives.
384pub use engine::pragma_tracker;
385/// Parser for Perl quote and quote-like operators.
386pub use engine::quote_parser;
387#[cfg(not(target_arch = "wasm32"))]
388/// Error classification and recovery strategies for parse failures.
389pub use error::classifier as error_classifier;
390/// Error recovery strategies for resilient parsing.
391pub use error::recovery as error_recovery;
392/// Parser utilities and helpers.
393pub use perl_parser_core::util;
394
395/// Line-to-byte offset index for fast position lookups.
396pub use perl_parser_core::line_index;
397/// Line ending detection and UTF-16 position mapping for LSP compliance.
398pub use position::{LineEnding, PositionMapper};
399
400/// Facade over `perl-semantic-analyzer` for compatibility imports.
401pub mod analysis;
402/// Perl builtin function signatures and metadata.
403pub mod builtins;
404/// Facade over parser-kernel types from `perl-parser-core`.
405pub mod core;
406#[cfg(feature = "incremental")]
407/// Incremental parsing for efficient re-parsing during editing.
408pub mod incremental;
409/// Canonical convenience imports for consumers.
410pub mod prelude;
411/// Code refactoring, modernization, and import optimization.
412pub mod refactor;
413/// Test-driven development support and test generation.
414pub mod tdd;
415/// Token stream, trivia, and token wrapper utilities.
416pub mod tokens;
417/// Facade over `perl-workspace` for compatibility imports.
418pub mod workspace;
419
420pub mod compat;
421
422// =============================================================================
423// Wave D absorbed satellite crates (as internal modules)
424// =============================================================================
425
426/// AST range and insertion helpers for Perl LSP features (previously `perl-ast-utils`).
427pub mod ast_utils;
428/// Anti-pattern detection for problematic Perl heredoc patterns (previously `perl-heredoc-anti-patterns`).
429// Wave D: allow missing_docs — original crate had an explicit exception per CLAUDE.md
430#[allow(missing_docs)]
431pub mod heredoc_anti_patterns;
432/// Secure workspace-relative path normalization (previously `perl-path-normalize`; from perl-parser-core).
433pub use perl_parser_core::path_normalize;
434/// Workspace-bound path validation and traversal prevention (previously `perl-path-security`; from perl-parser-core).
435pub use perl_parser_core::path_security;
436/// Nearest-rank percentile helpers for integer latency samples (previously `perl-percentile`; from perl-parser-core).
437pub use perl_parser_core::percentile;
438/// Perl qualified-name parsing, splitting, and validation helpers (previously `perl-qualified-name`; from perl-parser-core).
439pub use perl_parser_core::qualified_name;
440/// Shared Perl source-file classification helpers (previously `perl-source-file`; from perl-parser-core).
441pub use perl_parser_core::source_file;
442/// Text-line cursor and boundary helpers (previously `perl-text-line`; from perl-parser-core).
443pub use perl_parser_core::text_line;
444
445/// Variable and subroutine declaration analysis.
446pub use analysis::declaration;
447#[cfg(not(target_arch = "wasm32"))]
448/// File and symbol indexing for workspace-wide navigation.
449pub use analysis::index;
450/// Scope analysis for variable and subroutine resolution.
451pub use analysis::scope_analyzer;
452/// Semantic model with hover information and token classification.
453pub use analysis::semantic;
454/// Symbol table, extraction, and reference tracking.
455pub use analysis::symbol;
456/// Type inference engine for Perl variable analysis.
457pub use analysis::type_inference;
458/// Builtin function signature lookup tables.
459pub use builtins::builtin_signatures;
460/// Perfect hash function (PHF) based builtin signature lookup.
461pub use builtins::builtin_signatures_phf;
462/// Dead code detection for Perl workspaces (absorbed from `perl-dead-code`).
463#[cfg(not(target_arch = "wasm32"))]
464pub mod dead_code;
465/// Backwards-compatibility alias: `perl_parser::dead_code_detector` still works.
466#[cfg(not(target_arch = "wasm32"))]
467pub use dead_code as dead_code_detector;
468
469/// Import statement analysis and optimization.
470pub use refactor::import_optimizer;
471/// Code modernization utilities for Perl best practices.
472pub use refactor::modernize;
473/// Enhanced code modernization with refactoring capabilities.
474pub use refactor::modernize_refactored;
475/// Unified refactoring engine for comprehensive code transformations.
476pub use refactor::refactoring;
477/// Token stream with position-aware iteration.
478pub use tokens::token_stream;
479/// Lightweight token wrapper for AST integration.
480pub use tokens::token_wrapper;
481/// Trivia (whitespace and comments) representation.
482pub use tokens::trivia;
483/// Parser that preserves trivia tokens for formatting.
484pub use tokens::trivia_parser;
485
486#[cfg(feature = "incremental")]
487/// Advanced AST node reuse strategies for incremental parsing.
488pub use incremental::incremental_advanced_reuse;
489#[cfg(feature = "incremental")]
490/// Checkpoint-based incremental parsing with rollback support.
491pub use incremental::incremental_checkpoint;
492#[cfg(feature = "incremental")]
493/// Document-level incremental parsing state management.
494pub use incremental::incremental_document;
495#[cfg(feature = "incremental")]
496/// Edit representation and application for incremental updates.
497pub use incremental::incremental_edit;
498#[cfg(feature = "incremental")]
499#[deprecated(note = "LSP server moved to perl-lsp; perl-parser no longer handles didChange")]
500/// Legacy incremental handler (deprecated, use `perl-lsp` crate instead).
501pub use incremental::incremental_handler_v2;
502#[cfg(feature = "incremental")]
503/// Integration layer connecting incremental parsing with the full parser.
504pub use incremental::incremental_integration;
505#[cfg(feature = "incremental")]
506/// Simplified incremental parsing interface for common use cases.
507pub use incremental::incremental_simple;
508#[cfg(feature = "incremental")]
509/// Second-generation incremental parsing with improved node reuse.
510pub use incremental::incremental_v2;
511
512/// Basic TDD utilities and test helpers.
513pub use tdd::tdd_basic;
514#[cfg(test)]
515/// TDD workflow integration for Test-Driven Development support.
516pub use tdd::tdd_workflow;
517/// Intelligent test case generation from parsed Perl code.
518pub use tdd::test_generator;
519/// Test execution and TDD support functionality.
520pub use tdd::test_runner;
521
522/// In-memory document storage for open editor buffers.
523pub use workspace::document_store;
524/// Cross-file symbol index for workspace-wide navigation.
525pub use workspace::workspace_index;
526#[cfg(not(target_arch = "wasm32"))]
527/// Multi-file refactoring operations across a workspace.
528pub use workspace::workspace_refactor;
529/// Cross-file symbol renaming with conflict detection.
530pub use workspace::workspace_rename;
531
/// Recovery salvage class and profile types re-exported from the `error` module.
534pub use error::{RecoverySalvageClass, RecoverySalvageProfile};
535#[cfg(feature = "incremental")]
536/// Checkpointed incremental parser with simple edit tracking.
537pub use incremental_checkpoint::{CheckpointedIncrementalParser, SimpleEdit};
538/// Pragma state tracking for `use strict`, `use warnings`, etc.
539pub use pragma_tracker::{PragmaState, PragmaTracker};
540/// Token types and token stream for lexer output.
541pub use token_stream::{Token, TokenKind, TokenStream};
542/// Trivia (whitespace/comments) attached to AST nodes.
543pub use trivia::{NodeWithTrivia, Trivia, TriviaToken};
544/// Trivia-preserving parser and formatting utilities.
545pub use trivia_parser::{TriviaPreservingParser, format_with_trivia};
546
547// Incremental parsing exports (feature-gated)
548#[cfg(feature = "incremental")]
549/// Core incremental parsing types: edit representation, state, and application.
550pub use incremental::{Edit, IncrementalState, apply_edits};
551
552/// Semantic analysis types for hover, tokens, and code understanding.
553pub use semantic::{
554 HoverInfo, SemanticAnalyzer, SemanticModel, SemanticToken, SemanticTokenModifier,
555 SemanticTokenType,
556};
557/// Symbol extraction, table, and reference types for navigation.
558pub use symbol::{Symbol, SymbolExtractor, SymbolKind, SymbolReference, SymbolTable};
559
560// =============================================================================
561// LSP Feature Exports (DEPRECATED - migrated to perl-lsp crate)
562// =============================================================================
563// These exports are commented out during the migration period.
564// Use `perl_lsp` crate for LSP functionality instead.
565//
566// pub use code_actions::{CodeAction, CodeActionEdit, CodeActionKind, CodeActionsProvider};
567// pub use code_actions_enhanced::EnhancedCodeActionsProvider;
568// pub use code_actions_provider::{...};
569// pub use code_lens_provider::{CodeLens, CodeLensProvider, ...};
570// pub use completion::{CompletionContext, CompletionItem, CompletionItemKind, CompletionProvider};
571// pub use diagnostics::{Diagnostic, DiagnosticSeverity, DiagnosticTag, ...};
572// pub use document_links::compute_links;
573// pub use folding::{FoldingRange, FoldingRangeExtractor, FoldingRangeKind};
574// pub use formatting::{CodeFormatter, FormatTextEdit, FormattingOptions};
575// pub use inlay_hints::{parameter_hints, trivial_type_hints};
576// pub use lsp::protocol::{JsonRpcError, JsonRpcRequest, JsonRpcResponse};
577// pub use lsp_server::LspServer;
578// pub use on_type_formatting::compute_on_type_edit;
579// pub use rename::{RenameOptions, RenameProvider, RenameResult, TextEdit, apply_rename_edits};
580// pub use selection_range::{build_parent_map, selection_chain};
581// pub use semantic_tokens::{...};
582// pub use semantic_tokens_provider::{...};
583// pub use signature_help::{ParameterInfo, SignatureHelp, SignatureHelpProvider, SignatureInfo};
584// pub use workspace_symbols::{WorkspaceSymbol, WorkspaceSymbolsProvider};
585// =============================================================================
586
587/// Import analysis, optimization, and unused import detection.
588pub use import_optimizer::{
589 DuplicateImport, ImportAnalysis, ImportEntry, ImportOptimizer, MissingImport,
590 OrganizationSuggestion, SuggestionPriority, UnusedImport,
591};
592/// Scope analysis issue types and analyzer.
593pub use scope_analyzer::{IssueKind, ScopeAnalyzer, ScopeIssue};
594#[cfg(test)]
595/// Test generation, coverage reporting, and refactoring suggestions.
596pub use test_generator::{
597 CoverageReport, Priority, RefactoringCategory, RefactoringSuggester, RefactoringSuggestion,
598 TestCase, TestFramework, TestGenerator, TestGeneratorOptions, TestResults, TestRunner,
599};
600/// Type inference types: Perl types, constraints, and inference engine.
601pub use type_inference::{
602 PerlType, ScalarType, TypeBasedCompletion, TypeConstraint, TypeEnvironment,
603 TypeInferenceEngine, TypeLocation,
604};
605
606/// Refactoring engine types: configuration, operations, and results.
607pub use refactoring::{
608 ModernizationPattern, RefactoringConfig, RefactoringEngine, RefactoringOperation,
609 RefactoringResult, RefactoringScope, RefactoringType,
610};
611#[cfg(test)]
612/// TDD workflow types: actions, configuration, and cycle management.
613pub use tdd_workflow::{
614 AnnotationSeverity, CoverageAnnotation, TddAction, TddConfig, TddCycleResult, TddWorkflow,
615 TestType, WorkflowState, WorkflowStatus,
616};
617
#[cfg(test)]
mod tests {
    // Smoke tests for the crate-root parser facade (`Parser`, `NodeKind`).
    //
    // `Parser::parse` is expected to return `Ok` even for malformed input (see
    // `test_error_cases`), so tests that care about structure assert on the AST
    // shape explicitly instead of relying on `is_ok()` alone.
    use super::*;
    use perl_tdd_support::must;

    /// Parses `code` and asserts that the parser returned `Ok`.
    fn assert_parses(code: &str) {
        let mut parser = Parser::new(code);
        assert!(parser.parse().is_ok(), "Failed to parse: {}", code);
    }

    /// Parses `code` and asserts that its first statement is a binary expression
    /// (optionally wrapped in an `ExpressionStatement`) whose operator is
    /// `expected_op`.
    fn assert_binary_operator(code: &str, expected_op: &str) {
        let mut parser = Parser::new(code);
        let result = parser.parse();
        assert!(result.is_ok(), "Failed to parse: {}", code);

        let ast = must(result);
        // Check the root first so the structural assertions below can never be
        // skipped silently.
        assert!(
            matches!(ast.kind, NodeKind::Program { .. }),
            "Expected Program node, found: {:?}",
            ast.kind
        );

        if let NodeKind::Program { statements } = &ast.kind {
            assert!(!statements.is_empty(), "No statements found in AST for: {}", code);

            // The binary node may sit directly in the statement list or be
            // wrapped in an ExpressionStatement.
            let found_op = match &statements[0].kind {
                NodeKind::ExpressionStatement { expression } => match &expression.kind {
                    NodeKind::Binary { op, .. } => Some(op),
                    _ => None,
                },
                NodeKind::Binary { op, .. } => Some(op),
                _ => None,
            };

            assert!(
                found_op.is_some(),
                "Expected Binary operator for: {}. Found: {:?}",
                code,
                statements[0].kind
            );
            if let Some(op) = found_op {
                assert_eq!(op, expected_op, "Operator mismatch for: {}", code);
            }
        }
    }

    /// A simple declaration parses into a `Program` root node.
    #[test]
    fn test_basic_parsing() {
        let mut parser = Parser::new("my $x = 42;");
        let result = parser.parse();
        assert!(result.is_ok());

        let ast = must(result);
        assert!(matches!(ast.kind, NodeKind::Program { .. }));
    }

    /// Each declarator keyword yields a single `VariableDeclaration` carrying
    /// that keyword.
    #[test]
    fn test_variable_declaration() {
        let cases = [
            ("my $x;", "my"),
            ("our $y;", "our"),
            ("local $z;", "local"),
            ("state $w;", "state"),
        ];

        for (code, declarator) in cases {
            let mut parser = Parser::new(code);
            let result = parser.parse();
            assert!(result.is_ok(), "Failed to parse: {}", code);

            let ast = must(result);
            // Without this, a non-Program root would skip every check below.
            assert!(
                matches!(ast.kind, NodeKind::Program { .. }),
                "Expected Program node for: {}",
                code
            );

            if let NodeKind::Program { statements } = &ast.kind {
                assert_eq!(statements.len(), 1);
                assert!(
                    matches!(statements[0].kind, NodeKind::VariableDeclaration { .. }),
                    "Expected VariableDeclaration for: {}",
                    code
                );
                if let NodeKind::VariableDeclaration { declarator: decl, .. } =
                    &statements[0].kind
                {
                    assert_eq!(decl, declarator);
                }
            }
        }
    }

    /// Unambiguous binary operators are parsed as `Binary` nodes with the
    /// expected operator text.
    #[test]
    fn test_operators() {
        let cases = [
            ("$a + $b", "+"),
            ("$a - $b", "-"),
            ("$a * $b", "*"),
            ("$a . $b", "."),
            ("$a && $b", "&&"),
            ("$a || $b", "||"),
        ];

        for (code, expected_op) in cases {
            assert_binary_operator(code, expected_op);
        }
    }

    /// Operators that need context-aware lexing are still parsed as `Binary`.
    #[test]
    fn test_operators_with_context() {
        // These operators require context-aware parsing to disambiguate from similar syntax:
        // - `/` could be division or regex delimiter
        // - `%` could be modulo or hash sigil
        // - `**` could be exponent or glob pattern
        // - `//` could be defined-or or regex delimiter
        // The lexer handles disambiguation via LexerMode::ExpectTerm tracking.
        let cases: [(&str, &str); 4] = [
            ("2 / 3", "/"),     // Division (not regex)
            ("$a % $b", "%"),   // Modulo (not hash sigil)
            ("$a ** $b", "**"), // Exponent (not glob)
            ("$a // $b", "//"), // Defined-or (not regex)
        ];

        for (code, expected_op) in cases {
            assert_binary_operator(code, expected_op);
        }
    }

    /// Quoted and quote-like string literals parse without a hard failure.
    #[test]
    fn test_string_literals() {
        for code in [r#""hello""#, r#"'world'"#, r#"qq{foo}"#, r#"q{bar}"#] {
            assert_parses(code);
        }
    }

    /// Array/hash variables, element access, and slices parse without a hard failure.
    #[test]
    fn test_arrays_and_hashes() {
        let cases = [
            "@array",
            "%hash",
            "$array[0]",
            "$hash{key}",
            "@array[1, 2, 3]",
            "@hash{'a', 'b'}",
        ];

        for code in cases {
            assert_parses(code);
        }
    }

    /// Each subroutine form yields exactly one `Subroutine` statement.
    #[test]
    fn test_subroutines() {
        let cases = [
            "sub foo { }",
            "sub bar { return 42; }",
            "sub baz ($x, $y) { $x + $y }",
            "sub qux :method { }",
        ];

        for code in cases {
            let mut parser = Parser::new(code);
            let result = parser.parse();
            assert!(result.is_ok(), "Failed to parse: {}", code);

            let ast = must(result);
            // Without this, a non-Program root would skip every check below.
            assert!(
                matches!(ast.kind, NodeKind::Program { .. }),
                "Expected Program node for: {}",
                code
            );

            if let NodeKind::Program { statements } = &ast.kind {
                assert_eq!(statements.len(), 1);
                assert!(matches!(statements[0].kind, NodeKind::Subroutine { .. }));
            }
        }
    }

    /// Conditional and loop constructs parse without a hard failure.
    #[test]
    fn test_control_flow() {
        let cases = [
            "if ($x) { }",
            "if ($x) { } else { }",
            "if ($x) { } elsif ($y) { } else { }",
            "unless ($x) { }",
            "while ($x) { }",
            "until ($x) { }",
            "for (my $i = 0; $i < 10; $i++) { }",
            "foreach my $x (@array) { }",
        ];

        for code in cases {
            assert_parses(code);
        }
    }

    /// Match, substitution, transliteration, and binding forms parse without a
    /// hard failure.
    #[test]
    fn test_regex() {
        let cases = [
            "/pattern/",
            "m/pattern/",
            "s/old/new/",
            "tr/a-z/A-Z/",
            r#"qr/\d+/"#,
            "$x =~ /foo/",
            "$x !~ /bar/",
        ];

        for code in cases {
            assert_parses(code);
        }
    }

    /// Truncated input still returns `Ok` but leaves recorded errors on the parser.
    #[test]
    fn test_error_cases() {
        // NOTE(review): the second tuple element documents the intended
        // diagnostic but is not asserted; only the presence of a recorded error
        // is checked.
        let cases = [
            ("if (", "Unexpected end of input"),
            ("sub (", "Unexpected end of input"),
            ("my (", "Unexpected end of input"),
            ("{", "Unexpected end of input"),
        ];

        for (code, _expected_error) in cases {
            let mut parser = Parser::new(code);
            let result = parser.parse();

            // With error recovery, parse() succeeds but collects errors
            assert!(result.is_ok(), "Parser should recover from errors for: {}", code);

            // Check that errors were recorded
            let errors = parser.errors();
            assert!(!errors.is_empty(), "Expected recorded errors for: {}", code);
        }
    }

    /// Newer syntax (class/method, try/catch, defer, attributes) parses without
    /// a hard failure.
    #[test]
    fn test_modern_perl_features() {
        let cases = [
            "class Point { }",
            "method new { }",
            "try { } catch ($e) { }",
            "defer { }",
            "my $x :shared = 42;",
        ];

        for code in cases {
            assert_parses(code);
        }
    }

    /// Assorted tricky constructs parse without a hard failure.
    #[test]
    fn test_edge_cases() {
        let cases = [
            // Indirect object syntax
            "print STDOUT 'hello';",
            "new Class;",
            // Multi-variable declarations
            "my ($x, $y) = (1, 2);",
            "my ($a :shared, $b :locked);",
            // Complex expressions
            "$x->@*",
            "$x->%*",
            "$x->$*",
            // Defined-or
            "$x // 'default'",
            // ISA operator
            // NOTE(review): Perl's infix class-instance operator is spelled
            // lowercase `isa`; confirm the uppercase spelling here is intentional.
            "$obj ISA 'Class'",
        ];

        for code in cases {
            let mut parser = Parser::new(code);
            let result = parser.parse();
            assert!(result.is_ok(), "Failed to parse edge case: {}", code);
        }
    }
}