mod error;
mod util;
use cid::Cid;
pub use error::*;
use futures::{AsyncRead, AsyncWrite, Stream, StreamExt};
use fvm_shared::blockstore::Blockstore;
use fvm_shared::encoding::{from_slice, to_vec};
use serde::{Deserialize, Serialize};
use util::{ld_read, ld_write, read_node};
#[derive(Debug, Default, Serialize, Deserialize, PartialEq)]
pub struct CarHeader {
pub roots: Vec<Cid>,
pub version: u64,
}
impl CarHeader {
pub fn new(roots: Vec<Cid>, version: u64) -> Self {
Self { roots, version }
}
pub async fn write_stream_async<W, S>(
&self,
writer: &mut W,
stream: &mut S,
) -> Result<(), Error>
where
W: AsyncWrite + Send + Unpin,
S: Stream<Item = (Cid, Vec<u8>)> + Unpin,
{
let header_bytes = to_vec(self)?;
ld_write(writer, &header_bytes).await?;
while let Some((cid, bytes)) = stream.next().await {
ld_write(writer, &[cid.to_bytes(), bytes].concat()).await?;
}
Ok(())
}
}
impl From<Vec<Cid>> for CarHeader {
fn from(roots: Vec<Cid>) -> Self {
Self { roots, version: 1 }
}
}
pub struct CarReader<R> {
pub reader: R,
pub header: CarHeader,
}
impl<R> CarReader<R>
where
R: AsyncRead + Send + Unpin,
{
pub async fn new(mut reader: R) -> Result<Self, Error> {
let buf = ld_read(&mut reader)
.await?
.ok_or_else(|| Error::ParsingError("failed to parse uvarint for header".to_string()))?;
let header: CarHeader = from_slice(&buf).map_err(|e| Error::ParsingError(e.to_string()))?;
if header.roots.is_empty() {
return Err(Error::ParsingError("empty CAR file".to_owned()));
}
if header.version != 1 {
return Err(Error::InvalidFile("CAR file version must be 1".to_owned()));
}
Ok(CarReader { reader, header })
}
pub async fn next_block(&mut self) -> Result<Option<Block>, Error> {
let block = read_node(&mut self.reader)
.await?
.map(|(cid, data)| Block { cid, data });
Ok(block)
}
}
#[derive(Clone, Debug)]
pub struct Block {
cid: Cid,
data: Vec<u8>,
}
pub async fn load_car<R, B>(s: &B, reader: R) -> Result<Vec<Cid>, Error>
where
B: Blockstore,
R: AsyncRead + Send + Unpin,
{
let mut car_reader = CarReader::new(reader).await?;
let mut buf = Vec::with_capacity(100);
while let Some(block) = car_reader.next_block().await? {
buf.push((block.cid, block.data));
if buf.len() > 1000 {
s.put_many_keyed(buf.iter().map(|(k, v)| (*k, &*v)))
.map_err(|e| Error::Other(e.to_string()))?;
buf.clear();
}
}
s.put_many_keyed(buf.iter().map(|(k, v)| (*k, &*v)))
.map_err(|e| Error::Other(e.to_string()))?;
Ok(car_reader.header.roots)
}
#[cfg(test)]
mod tests {
use std::sync::Arc;
use async_std::channel::bounded;
use async_std::io::Cursor;
use async_std::sync::RwLock;
use cid::multihash::Code::Blake2b256;
use cid::multihash::MultihashDigest;
use fvm_shared::blockstore::MemoryBlockstore;
use fvm_shared::encoding::DAG_CBOR;
use super::*;
#[test]
fn symmetric_header() {
let cid = Cid::new_v1(DAG_CBOR, Blake2b256.digest(b"test"));
let header = CarHeader {
roots: vec![cid],
version: 1,
};
let bytes = to_vec(&header).unwrap();
assert_eq!(from_slice::<CarHeader>(&bytes).unwrap(), header);
}
#[async_std::test]
async fn car_write_read() {
let buffer: Arc<RwLock<Vec<u8>>> = Default::default();
let cid = Cid::new_v1(DAG_CBOR, Blake2b256.digest(b"test"));
let header = CarHeader {
roots: vec![cid],
version: 1,
};
assert_eq!(to_vec(&header).unwrap().len(), 60);
let (tx, mut rx) = bounded(10);
let buffer_cloned = buffer.clone();
let write_task = async_std::task::spawn(async move {
header
.write_stream_async(&mut *buffer_cloned.write().await, &mut rx)
.await
.unwrap()
});
tx.send((cid, b"test".to_vec())).await.unwrap();
drop(tx);
write_task.await;
let buffer: Vec<_> = buffer.read().await.clone();
let reader = Cursor::new(&buffer);
let bs = MemoryBlockstore::default();
load_car(&bs, reader).await.unwrap();
assert_eq!(bs.get(&cid).unwrap(), Some(b"test".to_vec()));
}
}