hardware 0.0.9

A no_std bare-metal hardware abstraction layer — all port I/O, memory and swap allocations are guarded at runtime. Do not consider this dependency stable before x.1.x
Documentation
use core::sync::atomic::{AtomicBool, AtomicUsize, Ordering};

static LPU_MMIO_BASE: AtomicUsize = AtomicUsize::new(0);
static LPU_MMIO_SIZE: AtomicUsize = AtomicUsize::new(0);
static LPU_INITIALIZED: AtomicBool = AtomicBool::new(false);

pub struct ArmLpuContext {
    pub mmio_base: usize,
    pub mmio_size: usize,
    pub device_id: u32,
    pub spi_id: u32,
    pub smmu_stream_id: u32,
    pub dma_region: usize,
}

pub fn init_lpu(mmio_base: usize, mmio_size: usize, spi_id: u32) -> Option<ArmLpuContext> {
    let device_id = super::platform::read_device_id(mmio_base);
    if device_id == 0 || device_id == 0xFFFF_FFFF {
        return None;
    }

    LPU_MMIO_BASE.store(mmio_base, Ordering::Release);
    LPU_MMIO_SIZE.store(mmio_size, Ordering::Release);

    super::platform::reset_device(mmio_base);
    super::platform::enable_clocks(mmio_base);

    let stream_id = super::smmu::configure_lpu_stream(mmio_base, 0x300);
    super::smmu::set_lpu_attributes(
        stream_id,
        super::smmu::ATTR_CACHEABLE | super::smmu::ATTR_SHAREABLE,
    );

    super::platform::configure_gic_spi(spi_id, 0);

    let dma_region = super::dma::setup_inference_region(mmio_base);

    LPU_INITIALIZED.store(true, Ordering::Release);

    Some(ArmLpuContext {
        mmio_base,
        mmio_size,
        device_id,
        spi_id,
        smmu_stream_id: stream_id,
        dma_region,
    })
}

pub fn is_initialized() -> bool {
    LPU_INITIALIZED.load(Ordering::Acquire)
}

pub fn read_lpu_reg(offset: usize) -> u32 {
    let base = LPU_MMIO_BASE.load(Ordering::Acquire);
    if base == 0 {
        return 0;
    }
    unsafe { super::super::mmio::mmio_read32(base + offset) }
}

pub fn write_lpu_reg(offset: usize, val: u32) {
    let base = LPU_MMIO_BASE.load(Ordering::Acquire);
    if base != 0 {
        unsafe {
            super::super::mmio::mmio_write32(base + offset, val);
        }
    }
}

pub fn diagnostics(mmio_base: usize) -> usize {
    let mut sig = is_initialized() as usize;
    sig ^= read_lpu_reg(0) as usize;
    write_lpu_reg(0, read_lpu_reg(4));
    sig ^= super::platform::read_revision(mmio_base) as usize;
    super::platform::power_on(mmio_base);
    super::platform::power_off(mmio_base);
    sig ^= super::platform::is_powered() as usize;
    super::platform::configure_inference(mmio_base, 0, 0, 0);
    super::platform::submit_prefill(mmio_base, 0, 0);
    super::platform::submit_decode(mmio_base, 0);
    super::platform::submit_speculative(mmio_base, 0, 0);
    sig ^= super::platform::is_ready(mmio_base) as usize;
    sig ^= super::platform::is_busy(mmio_base) as usize;
    sig ^= super::platform::has_error(mmio_base) as usize;
    sig ^= super::smmu::ATTR_NON_CACHEABLE as usize;
    sig ^= super::smmu::active_lpu_streams() as usize;
    sig ^= super::dma::alloc_inference_buffer(0);
    super::dma::submit_inference_dma(mmio_base, 0, 0, 0, true);
    sig ^= super::dma::is_dma_complete(mmio_base) as usize;
    sig ^= super::dma::has_dma_error(mmio_base) as usize;
    sig ^= super::dma::is_region_initialized() as usize;
    sig ^= super::dma::remaining_capacity();
    sig
}