scirs2-core 0.4.2

Core utilities and common functionality for SciRS2 (scirs2-core)
Documentation
//! Example demonstrating the use of memory-mapped arrays for efficient large data processing.
//!
//! This example shows how to:
//! 1. Create memory-mapped arrays
//! 2. Read from and write to memory-mapped arrays
//! 3. Process large datasets efficiently using memory mapping

use scirs2_core::memory_efficient::{create_mmap, create_temp_mmap, AccessMode};
use scirs2_core::ndarray_ext::{Array1, Array2, Array3, Ix2, Ix3};
use std::path::Path;
use std::time::Instant;
use tempfile::tempdir;

#[allow(dead_code)]
fn main() -> Result<(), Box<dyn std::error::Error>> {
    println!("Memory-Mapped Arrays Example");
    println!("============================\n");

    // Create a temporary directory for our example files
    let temp_dir = tempdir()?;
    println!("Using temporary directory: {:?}", temp_dir.path());

    // Basic example: Creating and reading a memory-mapped array
    basic_example(temp_dir.path())?;

    // Large array example: Efficient processing of data larger than RAM
    large_array_example(temp_dir.path())?;

    // 3D array example: Working with multi-dimensional data
    multi_dimensional_example(temp_dir.path())?;

    // Performance comparison: memory-mapped vs. in-memory arrays
    performance_comparison_example(temp_dir.path())?;

    // tempdir will automatically clean up the directory when dropped

    Ok(())
}

/// Basic example of creating and using memory-mapped arrays
#[allow(dead_code)]
fn basic_example(tempdir: &Path) -> Result<(), Box<dyn std::error::Error>> {
    println!("\n1. Basic Memory-Mapped Array Example");
    println!("----------------------------------");

    // Create some data
    let data = Array1::<f64>::linspace(0., 99., 100);
    println!("Created a 1D array with 100 elements");

    // Create a memory-mapped file from the data
    let file_path = tempdir.join("basic_example.bin");
    let mmap = create_mmap(&data, &file_path, AccessMode::Write, 0)?;
    println!("Created memory-mapped array at: {:?}", file_path);
    println!("  Shape: {:?}", mmap.shape);
    println!("  Size: {} elements", mmap.size);
    println!("  Mode: {:?}", mmap.mode);

    // For simplicity, instead of using open_mmap which has issues with header deserialization,
    // let's just verify the data we've written directly from the original memory-mapped array

    // Read the data from the original mmap
    let loaded_data = mmap.as_array::<scirs2_core::ndarray::Ix1>()?;

    // Verify some values
    println!(
        "Verifying data: [0] = {}, [50] = {}, [99] = {}",
        loaded_data[0], loaded_data[50], loaded_data[99]
    );

    Ok(())
}

/// Example showing how to work with large arrays using memory mapping
#[allow(dead_code)]
fn large_array_example(tempdir: &Path) -> Result<(), Box<dyn std::error::Error>> {
    println!("\n2. Large Array Processing Example");
    println!("-------------------------------");

    // Create a large 2D array (adjust size based on available memory)
    // For this example, we'll use a relatively small array
    let rows = 1000;
    let cols = 1000;
    let data = Array2::<f32>::from_shape_fn((rows, cols), |(i, j)| (i * cols + j) as f32);

    let size_mb = (rows * cols * std::mem::size_of::<f32>()) as f64 / (1024.0 * 1024.0);
    println!("Created a {}x{} array ({:.2} MB)", rows, cols, size_mb);

    // Use a temporary memory-mapped file instead
    let mut mmap = create_temp_mmap(&data, AccessMode::ReadWrite, 0)?;
    println!("Created temporary memory-mapped array");

    // Process the data without loading it all into memory
    // For example, compute the sum of all elements
    let sum = mmap.as_array::<Ix2>()?.sum();
    println!("Sum of all elements: {}", sum);

    // Find the maximum element
    let max = mmap
        .as_array::<Ix2>()?
        .fold(f32::MIN, |a, &b| f32::max(a, b));
    println!("Maximum element: {}", max);

    // We can also modify the data through the memory mapping
    // Get a mutable view
    {
        let mut array_mut = mmap.as_array_mut::<Ix2>()?;

        // Set the diagonal to zeros
        for i in 0..std::cmp::min(rows, cols) {
            array_mut[[i, i]] = 0.0;
        }
    }

    // Flush changes to disk
    mmap.flush()?;

    println!("Modified diagonal elements through memory mapping");

    Ok(())
}

/// Example showing how to work with multi-dimensional arrays
#[allow(dead_code)]
fn multi_dimensional_example(tempdir: &Path) -> Result<(), Box<dyn std::error::Error>> {
    println!("\n3. Multi-Dimensional Array Example");
    println!("---------------------------------");

    // Create a 3D array
    let shape = (10, 10, 10);
    let data = Array3::<i32>::from_shape_fn(shape, |(i, j, k)| (i * 100 + j * 10 + k) as i32);
    println!("Created a 10x10x10 3D array");

    // Create a temporary memory-mapped file
    let mmap = create_temp_mmap(&data, AccessMode::ReadWrite, 0)?;
    println!("Created temporary memory-mapped 3D array");

    // Access as a regular ndarray array
    let array = mmap.as_array::<Ix3>()?;

    // Instead of using slice which causes Dimension trait issues,
    // let's just access individual elements directly
    println!("Accessing some elements directly:");
    println!("Value at [5, 0, 0]: {}", array[[5, 0, 0]]);
    println!("Value at [5, 0, 1]: {}", array[[5, 0, 1]]);
    println!("Value at [5, 0, 2]: {}", array[[5, 0, 2]]);
    println!("Value at [5, 1, 0]: {}", array[[5, 1, 0]]);

    // Show the shape of the 3D array
    println!("3D array shape: {:?}", array.shape());

    Ok(())
}

/// Example comparing performance between memory-mapped and in-memory arrays
#[allow(dead_code)]
fn performance_comparison_example(tempdir: &Path) -> Result<(), Box<dyn std::error::Error>> {
    println!("\n4. Performance Comparison Example");
    println!("--------------------------------");

    // Create a smaller array for the example
    let rows = 1000;
    let cols = 1000;
    let size_mb = (rows * cols * std::mem::size_of::<f64>()) as f64 / (1024.0 * 1024.0);
    println!(
        "Using a {}x{} array ({:.2} MB) for performance comparison",
        rows, cols, size_mb
    );

    // Create in-memory array
    let start = Instant::now();
    let data =
        Array2::<f64>::from_shape_fn((rows, cols), |(i, j)| i as f64 * cols as f64 + j as f64);
    let in_memory_creation_time = start.elapsed();
    println!(
        "In-memory array creation time: {:?}",
        in_memory_creation_time
    );

    // For simplicity in this test, use a temporary memory-mapped array instead
    let start = Instant::now();
    let mmap = create_temp_mmap(&data, AccessMode::ReadWrite, 0)?;
    let mmap_creation_time = start.elapsed();
    println!(
        "Memory-mapped array creation time: {:?}",
        mmap_creation_time
    );

    // Performance for reading: In-memory
    let start = Instant::now();
    let in_memory_sum = data.sum();
    let in_memory_read_time = start.elapsed();
    println!(
        "In-memory array sum calculation time: {:?}",
        in_memory_read_time
    );

    // Performance for reading: Memory-mapped
    let start = Instant::now();
    let mmap_sum = mmap.as_array::<Ix2>()?.sum();
    let mmap_read_time = start.elapsed();
    println!(
        "Memory-mapped array sum calculation time: {:?}",
        mmap_read_time
    );

    // Verify we got the same result
    assert!((in_memory_sum - mmap_sum).abs() < 1e-10);
    println!("Both methods produced the same sum: {}", in_memory_sum);

    println!("\nPerformance Summary:");
    println!(
        "  Creation: Memory-mapped took {:.2}x the time of in-memory",
        mmap_creation_time.as_secs_f64() / in_memory_creation_time.as_secs_f64()
    );
    println!(
        "  Reading: Memory-mapped took {:.2}x the time of in-memory",
        mmap_read_time.as_secs_f64() / in_memory_read_time.as_secs_f64()
    );
    println!("  Note: The real advantage is for arrays larger than RAM");

    Ok(())
}