wain-exec 0.3.0

WebAssembly syntax tree executor for wain project
Documentation
use crate::globals::Globals;
use crate::trap::{Result, Trap, TrapReason};
use crate::value::LittleEndian;
use std::any;
use std::mem::size_of;
use wain_ast as ast;

const PAGE_SIZE: usize = 65536; // 64Ki
const MAX_MEMORY_BYTES: usize = u32::MAX as usize; // Address space of Wasm is 32bits

// Memory instance
//
// Note: It is more efficient to implement memory buffer by memory mapped buffer. However there is
// no way to use mmap without unsafe.
pub struct Memory {
    max: Option<u32>,
    data: Vec<u8>,
}

impl Memory {
    // https://webassembly.github.io/spec/core/exec/modules.html#alloc-mem
    pub fn allocate(memories: &[ast::Memory]) -> Result<Self> {
        // Note: Only one memory exists thanks to validation
        assert!(memories.len() <= 1);
        if let Some(memory) = memories.get(0) {
            if let Some(i) = &memory.import {
                Err(Trap::unknown_import(i, "memory", memory.start))
            } else {
                let (min, max) = match &memory.ty.limit {
                    ast::Limits::Range(min, max) => (*min, Some(*max)),
                    ast::Limits::From(min) => (*min, None),
                };
                let data = if min == 0 {
                    vec![]
                } else {
                    let len = (min as usize) * PAGE_SIZE;
                    vec![0; len]
                };
                Ok(Self { max, data })
            }
        } else {
            // When no table is set use dummy empty table
            Ok(Self {
                max: Some(0),
                data: vec![],
            })
        }
    }

    // 10. and 14. https://webassembly.github.io/spec/core/exec/modules.html#instantiation
    pub fn new_data(&mut self, segment: &ast::DataSegment, globals: &Globals) -> Result<()> {
        // By validation of constant expression, at least one instruction in the sequence is guaranteed
        // and type must be i32
        let offset = match &segment.offset[segment.offset.len() - 1].kind {
            ast::InsnKind::GlobalGet(idx) => globals.get(*idx),
            ast::InsnKind::I32Const(i) => *i,
            _ => unreachable!("unexpected instruction for element offset"),
        };
        let offset = offset as usize;
        let data = &segment.data;
        let end_addr = offset + data.len();

        if let Some(max) = self.max {
            let max = max as usize;
            if end_addr > max * PAGE_SIZE {
                return Err(Trap::new(
                    TrapReason::OutOfLimit {
                        max,
                        idx: end_addr,
                        kind: "data element",
                    },
                    segment.start,
                ));
            }
        }

        if self.data.len() < end_addr {
            return Err(Trap::new(
                TrapReason::DataSegmentOutOfBuffer {
                    segment_end: end_addr,
                    buffer_size: self.data.len(),
                },
                segment.start,
            ));
        }

        // TODO: copy_from_slice is slower here. I need to investigate the reason
        #[allow(clippy::manual_memcpy)]
        {
            for i in 0..data.len() {
                self.data[offset + i] = data[i];
            }
        }

        Ok(())
    }

    pub fn size(&self) -> u32 {
        (self.data.len() / PAGE_SIZE) as u32
    }

    pub fn grow(&mut self, num_pages: u32) -> i32 {
        // https://webassembly.github.io/spec/core/exec/instructions.html#exec-memory-grow
        let prev = self.size();
        let next = prev + num_pages;
        if let Some(max) = self.max {
            if next > max {
                return -1;
            }
        }
        let next_len = (next as usize) * PAGE_SIZE;
        if next_len > MAX_MEMORY_BYTES {
            // Note: WebAssembly spec does not limit max size of memory when no limit is specified
            // to memory section. However, an address value is u32. When memory size is larger than
            // UINT32_MAX, there is no way to refer it (except for using static offset value).
            // And memory_grow.wast expects allocating more than 2^32 - 1 to fail.
            return -1;
        }
        self.data.resize(next_len, 0);
        prev as i32
    }

    fn check_addr<V: LittleEndian>(
        &self,
        addr: usize,
        at: usize,
        operation: &'static str,
    ) -> Result<()> {
        if addr.saturating_add(size_of::<V>()) > self.data.len() {
            Err(Trap::new(
                TrapReason::LoadMemoryOutOfRange {
                    max: self.data.len(),
                    addr,
                    operation,
                    ty: any::type_name::<V>(),
                },
                at,
            ))
        } else {
            Ok(())
        }
    }

    // https://webassembly.github.io/spec/core/exec/instructions.html#and
    pub fn load<V: LittleEndian>(&self, addr: usize, at: usize) -> Result<V> {
        self.check_addr::<V>(addr, at, "load")?;
        Ok(LittleEndian::read(&self.data, addr))
    }

    // https://webassembly.github.io/spec/core/exec/instructions.html#and
    pub fn store<V: LittleEndian>(&mut self, addr: usize, v: V, at: usize) -> Result<()> {
        self.check_addr::<V>(addr, at, "store")?;
        LittleEndian::write(&mut self.data, addr, v);
        Ok(())
    }

    pub fn data(&self) -> &'_ [u8] {
        &self.data
    }

    pub fn data_mut(&mut self) -> &mut [u8] {
        &mut self.data
    }
}