1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81
// Copyright 2023 Lance Developers.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.
use std::ops::Range;
use std::sync::Arc;
use async_trait::async_trait;
use bytes::Bytes;
use lance_core::Result;
use object_store::{path::Path, ObjectStore};
use crate::traits::Reader;
/// Object Reader
///
/// Object Store + Base Path
///
/// Pairs a shared [`ObjectStore`] handle with the [`Path`] of a single object
/// and a block size; the [`Reader`] implementation for this type reads the
/// object's metadata and byte ranges through that handle.
#[derive(Debug)]
pub struct CloudObjectReader {
/// Shared handle to the object store that all requests are issued against.
pub object_store: Arc<dyn ObjectStore>,
/// Location of the object within `object_store`.
pub path: Path,
/// Value reported by `Reader::block_size`.
// NOTE(review): presumably the preferred I/O block size in bytes — confirm
// against the `Reader` trait documentation.
block_size: usize,
}
impl CloudObjectReader {
    /// Build a reader for the object at `path` inside `object_store`.
    ///
    /// `block_size` is stored as-is and later reported through
    /// `Reader::block_size`. No I/O is performed here, so the object is not
    /// checked for existence.
    ///
    /// # Errors
    ///
    /// The current implementation never fails; the `Result` return type is
    /// kept so callers can continue to use `?` on construction.
    pub fn new(object_store: Arc<dyn ObjectStore>, path: Path, block_size: usize) -> Result<Self> {
        let reader = Self {
            object_store,
            path,
            block_size,
        };
        Ok(reader)
    }
}
#[async_trait]
impl Reader for CloudObjectReader {
    /// Path of the object this reader targets.
    fn path(&self) -> &Path {
        &self.path
    }

    /// Block size this reader was constructed with.
    fn block_size(&self) -> usize {
        self.block_size
    }

    /// Object/File size, taken from the metadata returned by a `head`
    /// request against the object store.
    ///
    /// # Errors
    ///
    /// Propagates any error returned by the `head` request.
    async fn size(&self) -> Result<usize> {
        let meta = self.object_store.head(&self.path).await?;
        Ok(meta.size)
    }

    /// Fetch the bytes in `range` from the object.
    ///
    /// The request is attempted up to four times in total (one initial try
    /// plus three retries), with no delay between attempts.
    ///
    /// # Errors
    ///
    /// If every attempt fails, the error from the last attempt is returned;
    /// errors from earlier attempts are discarded.
    async fn get_range(&self, range: Range<usize>) -> Result<Bytes> {
        // The object store retries the initial request on its own, but a
        // failure while the response body is being streamed is not retried
        // there, hence this outer retry layer.
        const MAX_RETRIES: usize = 3;

        for _ in 0..MAX_RETRIES {
            let attempt = self.object_store.get_range(&self.path, range.clone()).await;
            if let Ok(data) = attempt {
                return Ok(data);
            }
            // Failure with retries remaining: drop the error and try again.
        }

        // Retries exhausted: make the final attempt and surface its outcome.
        let data = self.object_store.get_range(&self.path, range).await?;
        Ok(data)
    }
}