1
  2
  3
  4
  5
  6
  7
  8
  9
 10
 11
 12
 13
 14
 15
 16
 17
 18
 19
 20
 21
 22
 23
 24
 25
 26
 27
 28
 29
 30
 31
 32
 33
 34
 35
 36
 37
 38
 39
 40
 41
 42
 43
 44
 45
 46
 47
 48
 49
 50
 51
 52
 53
 54
 55
 56
 57
 58
 59
 60
 61
 62
 63
 64
 65
 66
 67
 68
 69
 70
 71
 72
 73
 74
 75
 76
 77
 78
 79
 80
 81
 82
 83
 84
 85
 86
 87
 88
 89
 90
 91
 92
 93
 94
 95
 96
 97
 98
 99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
use nom::*;
use std::io::{Result,ErrorKind,Error,Write,BufWriter,Seek,SeekFrom,Cursor};
use std::fs::File;
use std::marker::PhantomData;
use byteorder::{WriteBytesExt, LittleEndian};
use header::{DTypeToValue, Value, DType, parse_header};
/// Iterator that decodes values of type `T`, one row at a time, from a byte cursor.
///
/// Instances are built through `NpyIterator::new`; the `Iterator` implementation is
/// available whenever `T: NpyData`.
pub struct NpyIterator<'a, T> {
    /// Cursor over the bytes the rows are read from.
    cursor: Cursor<&'a [u8]>,
    /// Number of rows that have not been handed out yet.
    remaining: usize,
    /// Ties the iterator to its row type without storing a `T`.
    _t: PhantomData<T>,
}

impl<'a, T> NpyIterator<'a, T> {
    /// Creates an iterator that is expected to yield `n_rows` rows read from `cursor`.
    fn new(cursor: Cursor<&'a [u8]>, n_rows: usize) -> Self {
        NpyIterator {
            cursor,
            remaining: n_rows,
            _t: PhantomData,
        }
    }
}
/// Yields one decoded `T` per call until the stated number of rows has been produced.
///
/// # Panics
///
/// Panics when `T::read_row` returns `None` before the expected number of rows has been
/// read, and also when it still returns a row after the last expected one.
impl<'a, T> Iterator for NpyIterator<'a, T>
where
    T: NpyData,
{
    type Item = T;

    fn next(&mut self) -> Option<Self::Item> {
        if self.remaining > 0 {
            // Count the row before reading it, then insist that it can actually be read.
            self.remaining -= 1;
            let row = T::read_row(&mut self.cursor)
                .expect("File was too short (or the stated shape was too small).");
            return Some(row);
        }

        // Every promised row has been handed out; another readable row means the data
        // disagrees with the stated row count.
        if T::read_row(&mut self.cursor).is_some() {
            panic!("File was longer than the shape implied.");
        }
        None
    }
}
/// A row type that can be read from and written to the data section of an npy file.
///
/// `from_bytes` and `to_file` are generic over this trait.
pub trait NpyData : Sized {
    /// Returns the record description of this type as `(field name, field type)` pairs.
    ///
    /// `to_file` writes these pairs into the `'descr'` entry of the header, and
    /// `cursor_from_bytes` compares them against the `'descr'` entry of a parsed header.
    fn get_dtype() -> Vec<(&'static str, DType)>;
    /// Reads one row from the cursor.
    ///
    /// Returns `None` when no row could be read; `NpyIterator` treats that as the end of the data.
    fn read_row(c: &mut Cursor<&[u8]>) -> Option<Self>;
    /// Writes this row to `writer`, reporting any I/O error to the caller.
    fn write_row<W: Write>(&self, writer: &mut W) -> ::std::io::Result<()>;
}
/// Parses the header at the start of `bytes` and checks it against the row type `T`.
///
/// On success returns a cursor over the bytes that follow the header, together with the
/// single integer listed under the header's `'shape'` entry.
///
/// # Errors
///
/// Returns an `InvalidData` error when the header does not parse, when `'shape'` is missing
/// or is not a one-element list holding an integer, when `'descr'` is missing or is not a
/// list, or when `'descr'` differs from the description generated from `T::get_dtype()`.
fn cursor_from_bytes<T: NpyData>(bytes: &[u8]) -> Result<(Cursor<&[u8]>, i64)> {
    let (data, header) = match parse_header(bytes) {
        IResult::Done(rest, parsed) => (rest, parsed),
        IResult::Incomplete(needed) => {
            return Err(Error::new(ErrorKind::InvalidData, format!("{:?}", needed)));
        }
        IResult::Error(err) => {
            return Err(Error::new(ErrorKind::InvalidData, format!("{:?}", err)));
        }
    };

    // Both lookups below need the header to be a map; any other value is handled exactly
    // like a missing field.
    let fields = match header {
        Value::Map(ref map) => Some(map),
        _ => None,
    };

    let shape_entry = match fields.and_then(|map| map.get("shape")) {
        Some(&Value::List(ref dims)) if dims.len() == 1 => match dims.get(0) {
            Some(&Value::Integer(ref n)) => Some(*n),
            _ => None,
        },
        _ => None,
    };
    let n_rows: i64 = shape_entry.ok_or_else(|| {
        Error::new(
            ErrorKind::InvalidData,
            "\'shape\' field is not present or doesn't consist of a tuple of length 1.",
        )
    })?;

    let descr_entry = match fields.and_then(|map| map.get("descr")) {
        Some(&Value::List(ref items)) => Some(items),
        _ => None,
    };
    let descr: &[Value] = descr_entry.ok_or_else(|| {
        Error::new(
            ErrorKind::InvalidData,
            "\'descr\' field is not present or doesn't contain a list.",
        )
    })?;

    // The description derived from `T` must match the header's description exactly.
    let expected_type_ast: Vec<_> = T::get_dtype()
        .into_iter()
        .map(|(name, dtype)| dtype.to_value(&name))
        .collect();

    if expected_type_ast != descr {
        let message = format!(
            "Types don't match! type1: {:?}, type2: {:?}",
            expected_type_ast, descr
        );
        return Err(Error::new(ErrorKind::InvalidData, message));
    }

    Ok((Cursor::new(data), n_rows))
}
/// Creates an iterator over the rows of type `T` encoded in `bytes`.
///
/// The header is parsed and validated by `cursor_from_bytes`; the returned iterator then
/// reads rows from the bytes that follow the header.
///
/// # Errors
///
/// Returns any error reported by `cursor_from_bytes`. Additionally returns an
/// `InvalidData` error when the row count stated in the header is negative or does not
/// fit into `usize`.
pub fn from_bytes<'a, T: NpyData>(bytes: &'a [u8]) -> ::std::io::Result<NpyIterator<'a, T>> {
    let (cur, n_rows) = cursor_from_bytes::<T>(bytes)?;
    // A bare `as usize` cast would wrap a negative count into an enormous one (and truncate
    // large counts on 32-bit targets), which would only surface later as a panic inside the
    // iterator. Reject such headers here instead.
    if n_rows < 0 || n_rows as u64 > ::std::usize::MAX as u64 {
        return Err(Error::new(
            ErrorKind::InvalidData,
            format!("'shape' field holds an invalid number of rows: {}", n_rows),
        ));
    }
    Ok(NpyIterator::new(cur, n_rows as usize))
}
/// Writes the rows produced by `data` to the file `filename` in npy format (version 1.0).
///
/// The file starts with the magic string and version, followed by a little-endian `u16`
/// header length and a textual header describing `S::get_dtype()`. Because the number of
/// rows is only known once `data` has been consumed, the header is first written with a
/// fixed-width placeholder for the shape, which is overwritten after all rows are written.
///
/// # Errors
///
/// Returns any I/O error raised while creating, writing, seeking or flushing the file, as
/// well as any error returned by `NpyData::write_row`.
///
/// # Panics
///
/// Panics if the header (including padding) is longer than `u16::MAX` bytes, or if the
/// decimal row count is longer than the shape placeholder.
pub fn to_file<S,T>(filename: &str, data: T) -> ::std::io::Result<()> where
        S: NpyData,
        T: IntoIterator<Item=S> {
    let mut fw = BufWriter::new(File::create(filename)?);

    // `write_all` rather than `write`: a bare `write` may accept only part of the buffer,
    // and ignoring its return value would silently drop bytes.
    fw.write_all(&[0x93u8])?;
    fw.write_all(b"NUMPY")?;
    fw.write_all(&[0x01u8, 0x00])?;

    let mut header: Vec<u8> = vec![];
    header.extend_from_slice(b"{'descr': [");
    for (id, t) in S::get_dtype() {
        if t.shape.is_empty() {
            header.extend_from_slice(format!("('{}', '{}'), ", id, t.ty).as_bytes());
        } else {
            // Every dimension is followed by a comma, e.g. "2,3,".
            let shape_str: String = t.shape.into_iter().map(|n| format!("{},", n)).collect();
            header.extend_from_slice(
                format!("('{}', '{}', ({})), ", id, t.ty, shape_str).as_bytes(),
            );
        }
    }
    header.extend_from_slice(b"], 'fortran_order': False, 'shape': (");

    // File offset of the shape placeholder: 10 bytes (magic, version, header length)
    // precede the header text.
    let shape_pos = header.len() + 10;
    let filler = &b"abcdefghijklmnopqrs"[..];
    header.extend_from_slice(filler);
    header.extend_from_slice(b",), }");

    // Pad with spaces and a final newline so that preamble + header is a multiple of 16 bytes.
    let mut padding: Vec<u8> = vec![b' '; 15 - ((header.len() + 10) % 16)];
    padding.push(b'\n');

    let len = header.len() + padding.len();
    assert! (len <= ::std::u16::MAX as usize);
    assert!((len + 10) % 16 == 0);

    fw.write_u16::<LittleEndian>(len as u16)?;
    fw.write_all(&header)?;
    fw.write_all(&padding)?;

    let mut num = 0usize;
    for row in data {
        num += 1;
        row.write_row(&mut fw)?;
    }

    // Go back and replace the placeholder with the real row count. The closing ",), }" is
    // rewritten right after the number and the leftover width is filled with spaces, so the
    // header length stays unchanged.
    fw.seek(SeekFrom::Start(shape_pos as u64))?;
    let length = format!("{}", num);
    fw.write_all(length.as_bytes())?;
    fw.write_all(b",), }")?;
    fw.write_all(&vec![b' '; filler.len() - length.len()])?;

    // Flush explicitly: errors from the implicit flush on drop would be swallowed.
    fw.flush()?;
    Ok(())
}