1
  2
  3
  4
  5
  6
  7
  8
  9
 10
 11
 12
 13
 14
 15
 16
 17
 18
 19
 20
 21
 22
 23
 24
 25
 26
 27
 28
 29
 30
 31
 32
 33
 34
 35
 36
 37
 38
 39
 40
 41
 42
 43
 44
 45
 46
 47
 48
 49
 50
 51
 52
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
use std::sync::Arc;
use std::sync::Mutex;
use std::fs::File;
use std::io::Read;
use std::io::Seek;
use std::io::SeekFrom;
use std::ops::Range;
use std::cmp;
use std::io;

/// Maximum number of buffers kept in the cache; once this many are held, a
/// newly loaded buffer overwrites an existing slot instead of being appended.
const BUFFERS_COUNT: usize = 3;
/// Lower bound, in bytes, on the size of a buffer allocated for a load from
/// disk (0x8000 = 32 KiB); larger requests allocate the requested size.
const MINIMUM_BUFFER_SIZE: usize = 0x8000;

/// Errors reported by `FileView` operations.
///
/// Implements `Display` and `std::error::Error` so it can be printed and
/// propagated through `Box<dyn std::error::Error>`.
#[derive(Debug, Clone, PartialEq, Eq)]
pub enum FileViewError {
    /// An underlying I/O operation failed. The originating `io::Error` is
    /// not retained.
    IOError,
    /// The requested range reaches past the data available in the file.
    EndOfFileError
}

impl std::fmt::Display for FileViewError {
    fn fmt(&self, f: &mut std::fmt::Formatter) -> std::fmt::Result {
        let message = match *self {
            FileViewError::IOError => "I/O error while accessing the file",
            FileViewError::EndOfFileError => "requested range extends past the end of the file"
        };
        f.write_str(message)
    }
}

impl std::error::Error for FileViewError {}

/// Handle for reading byte ranges of a file through a small set of cached
/// buffers.
pub struct FileView {
    // File handle and buffer cache, shared behind a mutex; every operation
    // locks it for its whole duration.
    inner: Arc<Mutex<FileViewInner>>
}

/// Mutex-protected state of a `FileView`: the file and its buffer cache.
struct FileViewInner {
    // File that buffers are loaded from.
    file: File,
    // Cached buffers (at most `BUFFERS_COUNT`). A buffer that serves a
    // request is swapped one slot toward the end of the vector.
    buffers: Vec<Arc<FileViewBuffer>>
}

/// One cached chunk of the file.
struct FileViewBuffer {
    // Absolute file position that `data[0]` corresponds to.
    file_offset: u64,
    // Buffer contents, filled by reading the file starting at `file_offset`.
    data: Vec<u8>
}

/// Result of a `FileView::read`: a window into a shared cached buffer.
///
/// Holding the item keeps its buffer alive through the `Arc`, independently
/// of the cache.
pub struct FileViewItem {
    // Buffer that contains the requested bytes.
    buffer: Arc<FileViewBuffer>,
    // Start of the window, relative to the beginning of `buffer.data`.
    buffer_offset: u64,
    // Length of the window in bytes.
    len: u64
}

impl FileView {
    pub fn new(file: File) -> Self {
        FileView {
            inner: Arc::new(Mutex::new(FileViewInner {
                file: file,
                buffers: vec!()
            }))
        }
    }

    pub fn len(&self) -> Result<u64, FileViewError> {
        let inner = &mut *self.inner.lock().unwrap();
        Ok(inner.file.metadata()?.len())
    }

    pub fn read(&self, range: Range<u64>) -> Result<FileViewItem, FileViewError> {
        let inner = &mut *self.inner.lock().unwrap();

        let buffer = if let Some(buffer) = inner.get(&range) {
            buffer
        } else {
            // load a new chunk from disk
            inner.file.seek(SeekFrom::Start(range.start))?;
            let mut new_buffer = vec!(0;cmp::max(MINIMUM_BUFFER_SIZE, (range.end - range.start) as usize));
            inner.file.read(&mut new_buffer)?;

            // add it to our buffers
            let file_view_buffer = Arc::new(FileViewBuffer {
                file_offset: range.start,
                data: new_buffer
            });
            if inner.buffers.len() < BUFFERS_COUNT {
                inner.buffers.push(file_view_buffer.clone())
            } else {
                inner.buffers[0] = file_view_buffer.clone()
            }
            file_view_buffer
        };

        if range.end - buffer.file_offset > buffer.data.len() as u64 || range.end > inner.file.metadata()?.len() {
            return Err(FileViewError::EndOfFileError)
        }

        Ok(FileViewItem {
            buffer_offset: range.start - buffer.file_offset,
            buffer: buffer,
            len: range.end - range.start
        })
    }
}

impl FileViewInner {
    /// Looks up a cached buffer that fully covers `range`.
    ///
    /// On a hit the buffer is swapped with its right-hand neighbour (unless
    /// it already sits in the last slot) and a shared handle to it is
    /// returned. Returns `None` when no cached buffer covers the range.
    fn get(&mut self, range: &Range<u64>) -> Option<Arc<FileViewBuffer>> {
        self.get_buffer(range).map(|(slot, found)| {
            // Promote the hit by one position toward the end of the cache.
            if slot + 1 < self.buffers.len() {
                self.buffers.swap(slot, slot + 1);
            }
            found
        })
    }

    /// Returns the index of, and a handle to, the first cached buffer whose
    /// span contains all of `range`, or `None` if there is none.
    fn get_buffer(&self, range: &Range<u64>) -> Option<(usize, Arc<FileViewBuffer>)> {
        self.buffers
            .iter()
            .enumerate()
            .find(|&(_, candidate)| {
                let candidate_end = candidate.file_offset + (candidate.data.len() as u64);
                candidate_end >= range.end && candidate.file_offset <= range.start
            })
            .map(|(slot, candidate)| (slot, candidate.clone()))
    }
}

impl FileViewItem {
    /// Returns the bytes this item refers to, borrowed from the shared
    /// buffer.
    ///
    /// # Panics
    ///
    /// Panics if the item's window does not lie within the buffer's data.
    pub fn get(&self) -> &[u8] {
        let start = self.buffer_offset as usize;
        let stop = (self.buffer_offset + self.len) as usize;
        let window = start..stop;
        &self.buffer.data[window]
    }
}

impl From<io::Error> for FileViewError {
    fn from(_: io::Error) -> Self {
        FileViewError::IOError
    }
}