vb6parse 1.0.0

vb6parse is a library for parsing and analyzing VB6 code, from projects, to controls, to modules, and forms.
Documentation
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
//! VB6 Class File Parser Module
//!
//! This module provides functionality to parse VB6 class files (.cls).
//! It defines the `ClassFile` struct representing a VB6 class file,
//! along with methods to parse the file and extract relevant information
//! such as version, properties, and attributes.
//!

pub mod properties;

use std::fmt::Display;

use crate::{
    errors::{ClassError, ParserContext},
    files::{
        class::properties::{
            ClassHeader, ClassProperties, DataBindingBehavior, DataSourceBehavior, FileUsage,
            MtsStatus, Persistence,
        },
        common::{extract_attributes, extract_version},
    },
    io::SourceFile,
    lexer::tokenize,
    parsers::{
        cst::{parse, serialize_cst},
        SyntaxKind,
    },
    ConcreteSyntaxTree, ParseResult,
};

use serde::Serialize;

/// Represents a VB6 class file.
/// A VB6 class file contains a header and a concrete syntax tree.
///
/// The header contains the version, multi use, persistable, data binding behavior,
/// data source behavior, and MTS transaction mode.
/// The header also contains the attributes of the class file.
///
/// The cst contains the concrete syntax tree of the code of the class file.
#[derive(Debug, PartialEq, Eq, Clone, Serialize)]
pub struct ClassFile {
    /// The header of the class file.
    pub header: ClassHeader,
    /// The concrete syntax tree of the class file.
    /// This excludes nodes that are already represented in the header.
    #[serde(serialize_with = "serialize_cst")]
    pub cst: ConcreteSyntaxTree,
}

impl Display for ClassFile {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        write!(f, "VB6 Class File: {}", self.header.attributes.name)
    }
}

impl ClassFile {
    /// Parses a VB6 class file from a byte slice.
    ///
    /// # Arguments
    ///
    /// * `input` The byte slice to parse.
    ///
    /// # Returns
    ///
    /// A result containing the parsed VB6 class file or an error.
    ///
    /// # Errors
    ///
    /// An error will be returned if the input is not a valid VB6 class file.
    ///
    /// # Example
    ///
    /// ```rust
    /// use vb6parse::ClassFile;
    /// use vb6parse::io::SourceFile;
    ///
    /// let input = b"VERSION 1.0 CLASS
    /// BEGIN
    ///   MultiUse = -1  'True
    ///   Persistable = 0  'NotPersistable
    ///   DataBindingBehavior = 0  'vbNone
    ///   DataSourceBehavior = 0  'vbNone
    ///   MTSTransactionMode = 0  'NotAnMTSObject
    /// END
    /// Attribute VB_Name = \"Something\"
    /// Attribute VB_GlobalNameSpace = False
    /// Attribute VB_Creatable = True
    /// Attribute VB_PredeclaredId = False
    /// Attribute VB_Exposed = False
    /// ";
    ///
    /// let result = SourceFile::decode_with_replacement("class_parse.cls", input);
    ///
    /// let source_file = match result {
    ///     Ok(source_file) => source_file,
    ///     Err(e) => panic!("Failed to decode source file 'class_parse.cls': {e:?}"),
    /// };
    ///
    /// let result = ClassFile::parse(&source_file);
    ///
    /// assert!(result.has_result());
    /// ```
    #[must_use]
    pub fn parse(source_file: &SourceFile) -> ParseResult<'_, Self> {
        let mut input = source_file.source_stream();
        let mut ctx = ParserContext::new(input.file_name(), input.contents);

        // Parse tokens and create CST
        let token_stream_result = tokenize(&mut input);
        let (token_stream_opt, token_failures) = token_stream_result.unpack();

        ctx.extend_errors(token_failures);

        let Some(token_stream) = token_stream_opt else {
            return ParseResult::new(None, ctx.into_errors());
        };

        // Parse CST
        let cst = parse(token_stream);

        // Extract version from CST
        let Some(version) = extract_version(&cst) else {
            ctx.error(input.span_here(), ClassError::VersionKeywordMissing);

            return ParseResult::new(None, ctx.into_errors());
        };

        // Extract properties from CST
        let properties = extract_properties(&cst);

        // Extract attributes from CST
        let attributes = extract_attributes(&cst);

        let header = ClassHeader {
            version,
            properties,
            attributes,
        };

        // Filter out nodes that are already extracted to avoid duplication
        // For class files, we remove:
        // - VersionStatement (already in header.version)
        // - PropertiesBlock (BEGIN...END - already in header. properties)
        // - AttributeStatement nodes (already in header.attributes)
        let filtered_cst = cst.without_kinds(&[
            SyntaxKind::VersionStatement,
            SyntaxKind::PropertiesBlock,
            SyntaxKind::AttributeStatement,
        ]);

        ParseResult::new(
            Some(ClassFile {
                header,
                cst: filtered_cst,
            }),
            ctx.into_errors(),
        )
    }
}

/// Extract `VB6ClassProperties` from `PropertiesBlock` nodes in the CST
fn extract_properties(cst: &ConcreteSyntaxTree) -> ClassProperties {
    let mut multi_use = FileUsage::MultiUse;
    let mut persistable = Persistence::NotPersistable;
    let mut data_binding_behavior = DataBindingBehavior::None;
    let mut data_source_behavior = DataSourceBehavior::None;
    let mut mts_transaction_mode = MtsStatus::NotAnMTSObject;

    // Find the PropertiesBlock node
    let properties_blocks: Vec<_> = cst
        .children()
        .into_iter()
        .filter(|c| c.kind() == SyntaxKind::PropertiesBlock)
        .collect();

    if properties_blocks.is_empty() {
        return ClassProperties::default();
    }

    let properties_block = &properties_blocks[0];

    // Find all Property nodes within the PropertiesBlock
    let property_nodes: Vec<_> = properties_block
        .children()
        .iter()
        .filter(|c| c.kind() == SyntaxKind::Property)
        .collect();

    for prop_node in property_nodes {
        let mut key = String::new();
        let mut value = String::new();
        let mut found_equals = false;

        for child in prop_node.children() {
            if !child.is_token() {
                continue;
            }

            match child.kind() {
                SyntaxKind::PropertyKey => {
                    // This is a nested node, get its text
                    if let Some(first_child) = child.children().first() {
                        key = first_child.text().trim().to_string();
                    }
                }
                SyntaxKind::EqualityOperator => {
                    found_equals = true;
                }
                SyntaxKind::PropertyValue => {
                    // This is a nested node, get all its text
                    if found_equals {
                        for val_child in child.children() {
                            if val_child.is_token() {
                                match val_child.kind() {
                                    SyntaxKind::IntegerLiteral | SyntaxKind::LongLiteral => {
                                        value.push_str(val_child.text().trim());
                                    }
                                    SyntaxKind::SubtractionOperator => {
                                        value.push('-');
                                    }
                                    _ => {}
                                }
                            }
                        }
                    }
                }
                _ => {}
            }
        }

        // Process the extracted key-value pair
        if !key.is_empty() && !value.is_empty() {
            match key.as_str() {
                "MultiUse" => {
                    multi_use = if value == "-1" {
                        FileUsage::MultiUse
                    } else {
                        FileUsage::SingleUse
                    };
                }
                "Persistable" => {
                    persistable = if value == "-1" {
                        Persistence::Persistable
                    } else {
                        Persistence::NotPersistable
                    };
                }
                "DataBindingBehavior" => {
                    data_binding_behavior = match value.as_str() {
                        "1" => DataBindingBehavior::Simple,
                        "2" => DataBindingBehavior::Complex,
                        // When in doubt, default to None (0) which is the default VB6 behavior.
                        _ => DataBindingBehavior::None,
                    };
                }
                "DataSourceBehavior" => {
                    data_source_behavior = match value.as_str() {
                        "1" => DataSourceBehavior::DataSource,
                        // When in doubt, default to None (0) which is the default VB6 behavior.
                        _ => DataSourceBehavior::None,
                    };
                }
                "MTSTransactionMode" => {
                    mts_transaction_mode = match value.as_str() {
                        "1" => MtsStatus::NoTransactions,
                        "2" => MtsStatus::RequiresTransaction,
                        "3" => MtsStatus::UsesTransaction,
                        "4" => MtsStatus::RequiresNewTransaction,
                        // When in doubt, default to NotAnMTSObject (0) which is the default VB6 behavior.
                        _ => MtsStatus::NotAnMTSObject,
                    };
                }
                _ => {}
            }
        }
    }

    ClassProperties {
        multi_use,
        persistable,
        data_binding_behavior,
        data_source_behavior,
        mts_transaction_mode,
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::io::SourceFile;

    #[test]
    fn class_file_valid() {
        let class_bytes = r#"VERSION 1.0 CLASS
BEGIN
    MultiUse = -1  'True
    Persistable = 0  'NotPersistable
    DataBindingBehavior = 0  'vbNone
    DataSourceBehavior = 0  'vbNone
    MTSTransactionMode = 0  'NotAnMTSObject
END
Attribute VB_Name = \"Something\"
Attribute VB_GlobalNameSpace = False
Attribute VB_Creatable = True
Attribute VB_PredeclaredId = False
Attribute VB_Exposed = False
Attribute VB_Ext_KEY = \"SavedWithClassBuilder6\" ,\"Yes\"
Attribute VB_Ext_KEY = \"Saved\" ,\"False\"

Option Explicit
"#;

        let result = SourceFile::decode_with_replacement("test.cls", class_bytes.as_bytes());

        let source_file = match result {
            Ok(source_file) => source_file,
            Err(e) => panic!("Failed to decode source file 'test.cls': {e:?}"),
        };

        let result = ClassFile::parse(&source_file);

        if result.has_failures() {
            for failure in result.failures() {
                failure.print();
            }

            panic!("Class parse had failures");
        }

        assert!(result.has_result());
    }

    #[test]
    fn class_file_invalid() {
        // These should be '\r\n', or at worst '\n', but not '\r'.
        // '\r' is not even remotely a valid line ending.
        let class_bytes = b"VERSION 1.0 CLASS\r
                    BEGIN\r
                        MultiUse = -1  'True\r
                        Persistable = 0  'NotPersistable\r
                        DataBindingBehavior = 0  'vbNone\r
                        DataSourceBehavior = 0  'vbNone\r
                        MTSTransactionMode = 0  'NotAnMTSObject\r
                    END\r
                    Attribute VB_Name = \"Something\"\r
                    Attribute VB_GlobalNameSpace = False\r
                    Attribute VB_Creatable = True\r
                    Attribute VB_PredeclaredId = False\r
                    Attribute VB_Exposed = False\r
                    Attribute VB_Description = \"Description text\"\r
                    \r
                    Option Explicit\r";

        let result = SourceFile::decode_with_replacement("test.cls", class_bytes);

        let source_file = match result {
            Ok(source_file) => source_file,
            Err(e) => panic!("Failed to decode source file 'test.cls': {e:?}"),
        };

        let result = ClassFile::parse(&source_file);

        assert!(result.has_failures());
    }

    #[test]
    fn class_header_valid() {
        let input = b"VERSION 1.0 CLASS\r
    BEGIN\r
        MultiUse = -1  'True\r
        Persistable = 0  'NotPersistable\r
        DataBindingBehavior = 0  'vbNone\r
        DataSourceBehavior = 0  'vbNone\r
        MTSTransactionMode = 0  'NotAnMTSObject\r
    END\r
    Attribute VB_Name = \"Something\"\r
    Attribute VB_GlobalNameSpace = False\r
    Attribute VB_Creatable = True\r
    Attribute VB_PredeclaredId = False\r
    Attribute VB_Exposed = False";

        let sourcefile = SourceFile::decode_with_replacement("test.cls", input).unwrap();

        let result = ClassFile::parse(&sourcefile);

        assert!(result.has_result());
    }

    #[test]
    fn version_valid() {
        let class_bytes = b"VERSION 1.0 CLASS\r\n";

        let result = SourceFile::decode_with_replacement("test.cls", class_bytes);

        let source_file = match result {
            Ok(source_file) => source_file,
            Err(e) => panic!("Failed to decode source file 'test.cls': {e:?}"),
        };

        let mut source_stream = source_file.source_stream();
        let token_stream = tokenize(&mut source_stream).unwrap();
        let cst = parse(token_stream);

        let version = extract_version(&cst);

        assert!(version.is_some());
        let version = version.unwrap();
        assert_eq!(version.major, 1);
        assert_eq!(version.minor, 0);
    }

    #[test]
    fn version_invalid() {
        // 'VERSION' isn't correct - this will fail to tokenize properly
        let class_bytes = b"VERION 1.0 CLASS";

        let result = SourceFile::decode_with_replacement("test.cls", class_bytes);

        let source_file = match result {
            Ok(source_file) => source_file,
            Err(e) => panic!("Failed to decode source file 'test.cls': {e:?}"),
        };

        let mut source_stream = source_file.source_stream();
        let token_stream = tokenize(&mut source_stream).unwrap();
        let cst = parse(token_stream);

        let version = extract_version(&cst);

        // Should be None because there's no VERSION keyword
        assert!(version.is_none());
    }
}