1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
use crate::bucket::CHUNK_SIZE;
use crate::Result;
use async_std::fs::File;
use async_std::path::Path;
use futures::io::{AsyncRead, AsyncReadExt};
/// Computes an ETag string for the file at `path`.
///
/// The file is consumed through [`read_chunk`], one chunk at a time, and the
/// MD5 digest of every chunk is recorded. The result depends on how many
/// chunks were read:
///
/// * one chunk: the lowercase hex MD5 of the file contents;
/// * several chunks: the lowercase hex MD5 of the concatenated per-chunk
///   digests, followed by `-` and the number of chunks.
///
/// # Errors
///
/// Returns an error if the file cannot be opened or if reading from it fails.
pub async fn etag_for_path(path: impl AsRef<Path>) -> Result<String> {
    let mut file = File::open(path).await?;
    // Raw 16-byte MD5 digests of every chunk, back to back.
    let mut digests = Vec::new();
    let mut chunks = 0;
    loop {
        let chunk = read_chunk(&mut file).await?;
        let digest: [u8; 16] = md5::compute(&chunk).into();
        digests.extend_from_slice(&digest);
        chunks += 1;
        // A chunk shorter than CHUNK_SIZE means the reader hit end-of-file.
        if chunk.len() < CHUNK_SIZE {
            break;
        }
    }
    let etag = if chunks <= 1 {
        // Exactly one digest was collected and it already is the MD5 of the
        // whole file, so hex-encode it as is. Hashing it a second time would
        // yield the digest of the digest rather than of the content.
        digests
            .iter()
            .map(|byte| format!("{:02x}", byte))
            .collect::<String>()
    } else {
        format!("{:x}-{}", md5::compute(digests), chunks)
    };
    Ok(etag)
}
/// Reads the next chunk of data from `reader`.
///
/// Data is pulled in blocks of `LOCAL_CHUNK_SIZE` bytes and appended to the
/// chunk until either the reader reports end-of-stream or the chunk holds at
/// least `CHUNK_SIZE` bytes. Because whole blocks are appended, the returned
/// length is `CHUNK_SIZE` rounded up to a multiple of `LOCAL_CHUNK_SIZE`
/// unless the stream ended first; a result shorter than `CHUNK_SIZE` (possibly
/// empty) means the stream is exhausted.
///
/// Short reads are not mistaken for end-of-stream: only a read that returns
/// zero bytes ends the stream. The bytes are returned exactly as read,
/// including any trailing zero bytes.
///
/// # Errors
///
/// Returns an error if reading from `reader` fails.
pub async fn read_chunk<R: AsyncRead + Unpin>(reader: &mut R) -> Result<Vec<u8>> {
    const LOCAL_CHUNK_SIZE: usize = 8388;
    // The last block appended can push the length past CHUNK_SIZE by up to
    // LOCAL_CHUNK_SIZE - 1 bytes; reserve for that so the vector never has to
    // reallocate while it is being filled.
    let mut chunk = Vec::with_capacity(CHUNK_SIZE + LOCAL_CHUNK_SIZE);
    let mut buffer = [0u8; LOCAL_CHUNK_SIZE];
    loop {
        // Fill the block completely, or stop early at end-of-stream. A single
        // `read` may legitimately return fewer bytes than requested.
        let mut filled = 0;
        while filled < LOCAL_CHUNK_SIZE {
            let n = reader.read(&mut buffer[filled..]).await?;
            if n == 0 {
                break;
            }
            filled += n;
        }
        // Append exactly the bytes that were read; the byte count, not the
        // buffer contents, decides where the data ends.
        chunk.extend_from_slice(&buffer[..filled]);
        if filled < LOCAL_CHUNK_SIZE {
            // End of stream: this is the final, partial chunk.
            chunk.shrink_to_fit();
            break;
        }
        if chunk.len() >= CHUNK_SIZE {
            break;
        }
    }
    Ok(chunk)
}
#[cfg(test)]
mod test {
    use crate::utils::etag_for_path;
    use std::fs::File;
    use std::io::prelude::*;

    /// Builds a payload of `size` bytes in which every byte has the value 33.
    fn object(size: u32) -> Vec<u8> {
        vec![33; size as usize]
    }

    /// Writes a 10,000,000-byte fixture to disk and checks the ETag computed
    /// for it against a known value.
    #[tokio::test]
    async fn test_etag() {
        let path = "test_etag";
        // Best-effort removal of a fixture left over from an earlier run.
        let _ = std::fs::remove_file(path);

        let payload: Vec<u8> = object(10_000_000);
        let mut fixture = File::create(path).unwrap();
        fixture.write_all(&payload).unwrap();

        let computed = etag_for_path(path).await.unwrap();

        // Clean up before asserting so a failed assertion leaves no file behind.
        let _ = std::fs::remove_file(path);
        assert_eq!(computed, "ae890066cc055c740b3dc3c8854a643b-2");
    }
}