Skip to main content

rumdl_lib/rules/
md056_table_column_count.rs

1use crate::rule::{Fix, LintError, LintResult, LintWarning, Rule, Severity};
2use crate::utils::range_utils::calculate_line_range;
3use crate::utils::table_utils::TableUtils;
4
/// Rule MD056: Table column count
///
/// Ensures all rows in a table have the same number of cells.
///
/// See [docs/md056.md](../../docs/md056.md) for full documentation, configuration, and examples.
///
/// The rule carries no state, so `Default` is derived rather than hand-written.
#[derive(Debug, Clone, Default)]
pub struct MD056TableColumnCount;
17
18impl MD056TableColumnCount {
19    /// Try to fix a table row content (with list context awareness)
20    fn fix_table_row_content(
21        &self,
22        row_content: &str,
23        expected_count: usize,
24        flavor: crate::config::MarkdownFlavor,
25        table_block: &crate::utils::table_utils::TableBlock,
26        line_index: usize,
27        original_line: &str,
28    ) -> Option<String> {
29        let current_count = TableUtils::count_cells_with_flavor(row_content, flavor);
30
31        if current_count == expected_count || current_count == 0 {
32            return None;
33        }
34
35        let fixed = self.fix_row_by_truncation(row_content, expected_count, flavor)?;
36        Some(self.restore_prefixes(&fixed, table_block, line_index, original_line))
37    }
38
39    /// Restore list/blockquote prefixes to a fixed row
40    fn restore_prefixes(
41        &self,
42        fixed_content: &str,
43        table_block: &crate::utils::table_utils::TableBlock,
44        line_index: usize,
45        original_line: &str,
46    ) -> String {
47        // Extract blockquote prefix from original
48        let (blockquote_prefix, _) = TableUtils::extract_blockquote_prefix(original_line);
49
50        // Handle list context
51        if let Some(ref list_ctx) = table_block.list_context {
52            if line_index == 0 {
53                // Header line: use list prefix
54                format!("{blockquote_prefix}{}{fixed_content}", list_ctx.list_prefix)
55            } else {
56                // Continuation lines: use indentation
57                let indent = " ".repeat(list_ctx.content_indent);
58                format!("{blockquote_prefix}{indent}{fixed_content}")
59            }
60        } else {
61            // No list context, just blockquote
62            if blockquote_prefix.is_empty() {
63                fixed_content.to_string()
64            } else {
65                format!("{blockquote_prefix}{fixed_content}")
66            }
67        }
68    }
69
70    /// Fix a table row by truncating or adding cells
71    fn fix_row_by_truncation(
72        &self,
73        row: &str,
74        expected_count: usize,
75        flavor: crate::config::MarkdownFlavor,
76    ) -> Option<String> {
77        let current_count = TableUtils::count_cells_with_flavor(row, flavor);
78
79        if current_count == expected_count || current_count == 0 {
80            return None;
81        }
82
83        let trimmed = row.trim();
84        let has_leading_pipe = trimmed.starts_with('|');
85        let has_trailing_pipe = trimmed.ends_with('|');
86
87        // Delegate to shared cell splitting (returns only cell contents, no empty leading/trailing parts)
88        let cells = TableUtils::split_table_row_with_flavor(trimmed, flavor);
89        let mut cell_contents: Vec<&str> = cells.iter().map(|c| c.trim()).collect();
90
91        // Adjust cell count to match expected count
92        match current_count.cmp(&expected_count) {
93            std::cmp::Ordering::Greater => {
94                // Too many cells, remove excess
95                cell_contents.truncate(expected_count);
96            }
97            std::cmp::Ordering::Less => {
98                // Too few cells, add empty ones
99                while cell_contents.len() < expected_count {
100                    cell_contents.push("");
101                }
102            }
103            std::cmp::Ordering::Equal => {
104                // Perfect number of cells, no adjustment needed
105            }
106        }
107
108        // Reconstruct row
109        let mut result = String::new();
110        if has_leading_pipe {
111            result.push('|');
112        }
113
114        for (i, cell) in cell_contents.iter().enumerate() {
115            result.push_str(&format!(" {cell} "));
116            if i < cell_contents.len() - 1 || has_trailing_pipe {
117                result.push('|');
118            }
119        }
120
121        Some(result)
122    }
123}
124
125impl Rule for MD056TableColumnCount {
126    fn name(&self) -> &'static str {
127        "MD056"
128    }
129
130    fn description(&self) -> &'static str {
131        "Table column count should be consistent"
132    }
133
134    fn should_skip(&self, ctx: &crate::lint_context::LintContext) -> bool {
135        // Skip if no tables present
136        !ctx.likely_has_tables()
137    }
138
139    fn check(&self, ctx: &crate::lint_context::LintContext) -> LintResult {
140        let content = ctx.content;
141        let flavor = ctx.flavor;
142        let mut warnings = Vec::new();
143
144        // Early return for empty content or content without tables
145        if content.is_empty() || !content.contains('|') {
146            return Ok(Vec::new());
147        }
148
149        let lines = ctx.raw_lines();
150
151        // Use pre-computed table blocks from context
152        let table_blocks = &ctx.table_blocks;
153
154        for table_block in table_blocks {
155            // Collect all table lines for building the whole-table fix
156            let all_line_indices: Vec<usize> = std::iter::once(table_block.header_line)
157                .chain(std::iter::once(table_block.delimiter_line))
158                .chain(table_block.content_lines.iter().copied())
159                .collect();
160
161            // Determine expected column count from header row (strip list/blockquote prefix first)
162            let header_content = TableUtils::extract_table_row_content(lines[table_block.header_line], table_block, 0);
163            let expected_count = TableUtils::count_cells_with_flavor(header_content, flavor);
164
165            if expected_count == 0 {
166                continue; // Skip invalid tables
167            }
168
169            // Build the whole-table fix once for all warnings in this table
170            // This ensures that applying Quick Fix on any row fixes the entire table
171            let table_start_line = table_block.start_line + 1; // Convert to 1-indexed
172            let table_end_line = table_block.end_line + 1; // Convert to 1-indexed
173
174            // Build the complete fixed table content
175            let mut fixed_table_lines: Vec<String> = Vec::with_capacity(all_line_indices.len());
176            for (i, &line_idx) in all_line_indices.iter().enumerate() {
177                let line = lines[line_idx];
178                let row_content = TableUtils::extract_table_row_content(line, table_block, i);
179                let fixed_line = self
180                    .fix_table_row_content(row_content, expected_count, flavor, table_block, i, line)
181                    .unwrap_or_else(|| line.to_string());
182                if line_idx < lines.len() - 1 {
183                    fixed_table_lines.push(format!("{fixed_line}\n"));
184                } else {
185                    fixed_table_lines.push(fixed_line);
186                }
187            }
188            let table_replacement = fixed_table_lines.concat();
189            let table_range = ctx.line_index.multi_line_range(table_start_line, table_end_line);
190
191            // Check all rows in the table
192            for (i, &line_idx) in all_line_indices.iter().enumerate() {
193                let line = lines[line_idx];
194                let row_content = TableUtils::extract_table_row_content(line, table_block, i);
195                let count = TableUtils::count_cells_with_flavor(row_content, flavor);
196
197                if count > 0 && count != expected_count {
198                    // Calculate precise character range for the entire table row
199                    let (start_line, start_col, end_line, end_col) = calculate_line_range(line_idx + 1, line);
200
201                    // Each warning uses the same whole-table fix
202                    // This ensures Quick Fix on any row fixes the entire table
203                    warnings.push(LintWarning {
204                        rule_name: Some(self.name().to_string()),
205                        message: format!("Table row has {count} cells, but expected {expected_count}"),
206                        line: start_line,
207                        column: start_col,
208                        end_line,
209                        end_column: end_col,
210                        severity: Severity::Warning,
211                        fix: Some(Fix {
212                            range: table_range.clone(),
213                            replacement: table_replacement.clone(),
214                        }),
215                    });
216                }
217            }
218        }
219
220        Ok(warnings)
221    }
222
223    fn fix(&self, ctx: &crate::lint_context::LintContext) -> Result<String, LintError> {
224        let content = ctx.content;
225        let flavor = ctx.flavor;
226        let lines = ctx.raw_lines();
227        let table_blocks = &ctx.table_blocks;
228
229        let mut result_lines: Vec<String> = lines.iter().map(|&s| s.to_string()).collect();
230
231        for table_block in table_blocks {
232            // Collect all table lines
233            let all_line_indices: Vec<usize> = std::iter::once(table_block.header_line)
234                .chain(std::iter::once(table_block.delimiter_line))
235                .chain(table_block.content_lines.iter().copied())
236                .collect();
237
238            // Determine expected column count from header row (strip list/blockquote prefix first)
239            let header_content = TableUtils::extract_table_row_content(lines[table_block.header_line], table_block, 0);
240            let expected_count = TableUtils::count_cells_with_flavor(header_content, flavor);
241
242            if expected_count == 0 {
243                continue; // Skip invalid tables
244            }
245
246            // Fix all rows in the table
247            for (i, &line_idx) in all_line_indices.iter().enumerate() {
248                let line = lines[line_idx];
249                let row_content = TableUtils::extract_table_row_content(line, table_block, i);
250                if let Some(fixed_line) =
251                    self.fix_table_row_content(row_content, expected_count, flavor, table_block, i, line)
252                {
253                    result_lines[line_idx] = fixed_line;
254                }
255            }
256        }
257
258        let mut fixed = result_lines.join("\n");
259        // Preserve trailing newline if original content had one
260        if content.ends_with('\n') && !fixed.ends_with('\n') {
261            fixed.push('\n');
262        }
263        Ok(fixed)
264    }
265
266    fn as_any(&self) -> &dyn std::any::Any {
267        self
268    }
269
270    fn from_config(_config: &crate::config::Config) -> Box<dyn Rule>
271    where
272        Self: Sized,
273    {
274        Box::new(MD056TableColumnCount)
275    }
276}
277
#[cfg(test)]
mod tests {
    use super::*;
    use crate::lint_context::LintContext;

    /// Run the rule's `check` over `markdown` using the standard flavor.
    fn lint(markdown: &str) -> Vec<LintWarning> {
        let ctx = LintContext::new(markdown, crate::config::MarkdownFlavor::Standard, None);
        MD056TableColumnCount.check(&ctx).unwrap()
    }

    /// Run the rule's `fix` over `markdown` using the standard flavor.
    fn autofix(markdown: &str) -> String {
        let ctx = LintContext::new(markdown, crate::config::MarkdownFlavor::Standard, None);
        MD056TableColumnCount.fix(&ctx).unwrap()
    }

    #[test]
    fn test_valid_table() {
        let warnings = lint(
            "| Header 1 | Header 2 | Header 3 |\n\
             |----------|----------|----------|\n\
             | Cell 1   | Cell 2   | Cell 3   |\n\
             | Cell 4   | Cell 5   | Cell 6   |",
        );

        assert_eq!(warnings.len(), 0);
    }

    #[test]
    fn test_too_few_columns() {
        let warnings = lint(
            "| Header 1 | Header 2 | Header 3 |\n\
             |----------|----------|----------|\n\
             | Cell 1   | Cell 2   |\n\
             | Cell 4   | Cell 5   | Cell 6   |",
        );

        assert_eq!(warnings.len(), 1);
        assert_eq!(warnings[0].line, 3);
        assert!(warnings[0].message.contains("has 2 cells, but expected 3"));
    }

    #[test]
    fn test_too_many_columns() {
        let warnings = lint(
            "| Header 1 | Header 2 |\n\
             |----------|----------|\n\
             | Cell 1   | Cell 2   | Cell 3   | Cell 4   |\n\
             | Cell 5   | Cell 6   |",
        );

        assert_eq!(warnings.len(), 1);
        assert_eq!(warnings[0].line, 3);
        assert!(warnings[0].message.contains("has 4 cells, but expected 2"));
    }

    #[test]
    fn test_delimiter_row_mismatch() {
        let warnings = lint(
            "| Header 1 | Header 2 | Header 3 |\n\
             |----------|----------|\n\
             | Cell 1   | Cell 2   | Cell 3   |",
        );

        assert_eq!(warnings.len(), 1);
        assert_eq!(warnings[0].line, 2);
        assert!(warnings[0].message.contains("has 2 cells, but expected 3"));
    }

    #[test]
    fn test_fix_too_few_columns() {
        let output = autofix(
            "| Header 1 | Header 2 | Header 3 |\n\
             |----------|----------|----------|\n\
             | Cell 1   | Cell 2   |\n\
             | Cell 4   | Cell 5   | Cell 6   |",
        );

        assert!(output.contains("| Cell 1 | Cell 2 |  |"));
    }

    #[test]
    fn test_fix_too_many_columns() {
        let output = autofix(
            "| Header 1 | Header 2 |\n\
             |----------|----------|\n\
             | Cell 1   | Cell 2   | Cell 3   | Cell 4   |\n\
             | Cell 5   | Cell 6   |",
        );

        assert!(output.contains("| Cell 1 | Cell 2 |"));
        assert!(!output.contains("Cell 3"));
        assert!(!output.contains("Cell 4"));
    }

    #[test]
    fn test_no_leading_pipe() {
        let warnings = lint(
            "Header 1 | Header 2 | Header 3 |\n\
             ---------|----------|----------|\n\
             Cell 1   | Cell 2   |\n\
             Cell 4   | Cell 5   | Cell 6   |",
        );

        assert_eq!(warnings.len(), 1);
        assert_eq!(warnings[0].line, 3);
    }

    #[test]
    fn test_no_trailing_pipe() {
        let warnings = lint(
            "| Header 1 | Header 2 | Header 3\n\
             |----------|----------|----------\n\
             | Cell 1   | Cell 2\n\
             | Cell 4   | Cell 5   | Cell 6",
        );

        assert_eq!(warnings.len(), 1);
        assert_eq!(warnings[0].line, 3);
    }

    #[test]
    fn test_no_pipes_at_all() {
        let warnings = lint(
            "This is not a table\n\
             Just regular text\n\
             No pipes here",
        );

        assert_eq!(warnings.len(), 0);
    }

    #[test]
    fn test_empty_cells() {
        let warnings = lint(
            "| Header 1 | Header 2 | Header 3 |\n\
             |----------|----------|----------|\n\
             |          |          |          |\n\
             | Cell 1   |          | Cell 3   |",
        );

        assert_eq!(warnings.len(), 0);
    }

    #[test]
    fn test_multiple_tables() {
        let warnings = lint(
            "| Table 1 Col 1 | Table 1 Col 2 |\n\
             |----------------|----------------|\n\
             | Data 1         | Data 2         |\n\
             \n\
             Some text in between.\n\
             \n\
             | Table 2 Col 1 | Table 2 Col 2 | Table 2 Col 3 |\n\
             |----------------|----------------|----------------|\n\
             | Data 3         | Data 4         |\n\
             | Data 5         | Data 6         | Data 7         |",
        );

        assert_eq!(warnings.len(), 1);
        assert_eq!(warnings[0].line, 9);
        assert!(warnings[0].message.contains("has 2 cells, but expected 3"));
    }

    #[test]
    fn test_table_with_escaped_pipes() {
        // Single backslash escapes the pipe: \| keeps pipe as content (2 columns)
        let single_escape = lint(
            "| Command | Description |\n\
             |---------|-------------|\n\
             | `echo \\| grep` | Pipe example |\n\
             | `ls` | List files |",
        );
        assert_eq!(single_escape.len(), 0, "escaped pipe \\| should not split cells");

        // Double backslash + pipe inside code span: pipe is still masked by code span
        let double_escape = lint(
            "| Command | Description |\n\
             |---------|-------------|\n\
             | `echo \\\\| grep` | Pipe example |\n\
             | `ls` | List files |",
        );
        // The \\| is inside backticks, so the pipe is content, not a delimiter
        assert_eq!(
            double_escape.len(),
            0,
            "pipes inside code spans should not split cells"
        );
    }

    #[test]
    fn test_empty_content() {
        let warnings = lint("");

        assert_eq!(warnings.len(), 0);
    }

    #[test]
    fn test_code_block_with_table() {
        let warnings = lint(
            "```\n\
             | This | Is | Code |\n\
             |------|----|----|\n\
             | Not  | A  | Table |\n\
             ```\n\
             \n\
             | Real | Table |\n\
             |------|-------|\n\
             | Data | Here  |",
        );

        // Should not check tables inside code blocks
        assert_eq!(warnings.len(), 0);
    }

    #[test]
    fn test_fix_preserves_pipe_style() {
        // Test with no trailing pipes
        let output = autofix(
            "| Header 1 | Header 2 | Header 3\n\
             |----------|----------|----------\n\
             | Cell 1   | Cell 2",
        );

        let rows: Vec<&str> = output.lines().collect();
        assert!(!rows[2].ends_with('|'));
        assert!(rows[2].contains("Cell 1"));
        assert!(rows[2].contains("Cell 2"));
    }

    #[test]
    fn test_single_column_table() {
        let warnings = lint(
            "| Header |\n\
             |---------|\n\
             | Cell 1  |\n\
             | Cell 2  |",
        );

        assert_eq!(warnings.len(), 0);
    }

    #[test]
    fn test_complex_delimiter_row() {
        let warnings = lint(
            "| Left | Center | Right |\n\
             |:-----|:------:|------:|\n\
             | L    | C      | R     |\n\
             | Left | Center |",
        );

        assert_eq!(warnings.len(), 1);
        assert_eq!(warnings[0].line, 4);
    }

    #[test]
    fn test_unicode_content() {
        let warnings = lint(
            "| 名前 | 年齢 | 都市 |\n\
             |------|------|------|\n\
             | 田中 | 25   | 東京 |\n\
             | 佐藤 | 30   |",
        );

        assert_eq!(warnings.len(), 1);
        assert_eq!(warnings[0].line, 4);
    }

    #[test]
    fn test_very_long_cells() {
        let warnings = lint(
            "| Short | Very very very very very very very very very very long header | Another |\n\
             |-------|--------------------------------------------------------------|---------|\n\
             | Data  | This is an extremely long cell content that goes on and on   |",
        );

        assert_eq!(warnings.len(), 1);
        assert!(warnings[0].message.contains("has 2 cells, but expected 3"));
    }

    #[test]
    fn test_fix_with_newline_ending() {
        let output = autofix(
            "| A | B | C |\n\
             |---|---|---|\n\
             | 1 | 2 |\n",
        );

        assert!(output.ends_with('\n'));
        assert!(output.contains("| 1 | 2 |  |"));
    }

    #[test]
    fn test_fix_without_newline_ending() {
        let output = autofix(
            "| A | B | C |\n\
             |---|---|---|\n\
             | 1 | 2 |",
        );

        assert!(!output.ends_with('\n'));
        assert!(output.contains("| 1 | 2 |  |"));
    }

    #[test]
    fn test_blockquote_table_column_mismatch() {
        let warnings = lint(
            "> | Header 1 | Header 2 | Header 3 |\n\
             > |----------|----------|----------|\n\
             > | Cell 1   | Cell 2   |",
        );

        assert_eq!(warnings.len(), 1);
        assert_eq!(warnings[0].line, 3);
        assert!(warnings[0].message.contains("has 2 cells, but expected 3"));
    }

    #[test]
    fn test_fix_blockquote_table_preserves_prefix() {
        let output = autofix(
            "> | Header 1 | Header 2 | Header 3 |\n\
             > |----------|----------|----------|\n\
             > | Cell 1   | Cell 2   |\n\
             > | Cell 4   | Cell 5   | Cell 6   |",
        );

        // Each line should still start with "> "
        for line in output.lines() {
            assert!(line.starts_with("> "), "Line should preserve blockquote prefix: {line}");
        }
        // The fixed row should have 3 cells
        assert!(output.contains("> | Cell 1 | Cell 2 |  |"));
    }

    #[test]
    fn test_fix_nested_blockquote_table() {
        let output = autofix(
            ">> | A | B | C |\n\
             >> |---|---|---|\n\
             >> | 1 | 2 |",
        );

        // Each line should preserve the nested blockquote prefix
        for line in output.lines() {
            assert!(
                line.starts_with(">> "),
                "Line should preserve nested blockquote prefix: {line}"
            );
        }
        assert!(output.contains(">> | 1 | 2 |  |"));
    }

    #[test]
    fn test_blockquote_table_too_many_columns() {
        let output = autofix(
            "> | A | B |\n\
             > |---|---|\n\
             > | 1 | 2 | 3 | 4 |",
        );

        // Should preserve blockquote prefix while truncating columns
        assert!(output.lines().nth(2).unwrap().starts_with("> "));
        assert!(output.contains("> | 1 | 2 |"));
        assert!(!output.contains("| 3 |"));
    }
}