zfs 0.1.0 - Docs.rs

use std::collections::{HashMap, VecDeque};

use super::dvaddr::DVAddr;
use super::zio;
use super::djb2::Djb2;
use std::hash::BuildHasherDefault;

/// MRU - Most Recently Used cache
struct Mru {
    map: HashMap<DVAddr, Vec<u8>, BuildHasherDefault<Djb2>>,
    /// Oldest DVAddrs are at the end
    queue: VecDeque<DVAddr>, 
    /// Max mru cache size in blocks
    size: usize,
    /// Number of used blocks in mru cache
    used: usize,
}

impl Mru {
    pub fn new() -> Self {
        Mru {
            map: HashMap::with_hasher(Default::default()),
            queue: VecDeque::new(),
            size: 1000,
            used: 0,
        }
    }

    pub fn cache_block(&mut self, dva: &DVAddr, block: Vec<u8>) -> Result<Vec<u8>, &str> {
        // If necessary, make room for the block in the cache
        while self.used + (dva.asize() as usize) > self.size {
            let last_dva = match self.queue.pop_back() {
                Some(dva) => dva,
                None => return Err("No more ARC MRU items to free"),
            };
            self.map.remove(&last_dva);
            self.used -= last_dva.asize() as usize;
        }

        // Add the block to the cache
        self.used += dva.asize() as usize;
        self.map.insert(*dva, block);
        self.queue.push_front(*dva);
        Ok(self.map.get(dva).unwrap().clone())
    }
}

/// MFU - Most Frequently Used cache
struct Mfu {
    // TODO: Keep track of use counts. So mfu_map becomes (use_count: u64, Vec<u8>). Reset the use
    // count every once in a while. For instance, every 1000 reads. This will probably end up being
    // a knob for the user.
    // TODO: Keep track of minimum frequency and corresponding DVA
    map: HashMap<DVAddr, (u64, Vec<u8>), BuildHasherDefault<Djb2>>,
    size: usize, // Max mfu cache size in blocks
    used: usize, // Number of used bytes in mfu cache
}

impl Mfu {
    pub fn new() -> Self {
        Mfu {
            map: HashMap::with_hasher(Default::default()),
            size: 1000,
            used: 0,
        }
    }

    pub fn cache_block(&mut self, dva: &DVAddr, block: Vec<u8>) -> Result<&[u8], &str> {
        {
            let mut lowest_freq = !0;
            let mut lowest_dva  = Err("No valid DVA found.");

            for (&dva_key, &(freq, _)) in self.map.iter() {
                if freq < lowest_freq {
                    lowest_freq = freq;
                    lowest_dva = Ok(dva_key);
                }
            }

            self.map.remove(&try!(lowest_dva));
        }

        // Add the block to the cache
        self.used += dva.asize() as usize;
        self.map.insert(*dva, (2, block));
        Ok(&self.map.get(dva).unwrap().1)
    }
}

/// Our implementation of the Adaptive Replacement Cache (ARC) is set up to allocate
/// its buffer on the heap rather than in a private pool thing. This makes it much
/// simpler to implement, but defers the fragmentation problem to the heap allocator.
/// We named the type `ArCache` to avoid confusion with Rust's `Arc` reference type.
pub struct ArCache {
    mru: Mru,
    mfu: Mfu,
}

impl ArCache {
    pub fn new() -> Self {
        ArCache {
            mru: Mru::new(),
            mfu: Mfu::new(),
        }
    }

    pub fn read(&mut self, reader: &mut zio::Reader, dva: &DVAddr) -> Result<Vec<u8>, &str> {
        if let Some(block) = self.mru.map.remove(dva) {
            self.mfu.map.insert(*dva, (0, block.clone()));

            // Block is cached
            return Ok(block);
        }
        if let Some(block) = self.mfu.map.get_mut(dva) {
            // Block is cached
            if block.0 > 1000 {
                block.0 = 0;
            } else {
                block.0 += 1;
            }

            return Ok(block.1.clone());
        }

        // Block isn't cached, have to read it from disk
        let block = reader.read(dva.sector() as usize, dva.asize() as usize);

        // Blocks start in MRU cache
        self.mru.cache_block(dva, block)
    }
}