use std::borrow::Cow;
use std::io::{Cursor, Read};
use std::sync::Arc;
use flate2::bufread::{GzDecoder, GzEncoder};
use super::{
GzipCodecConfiguration, GzipCodecConfigurationV1, GzipCompressionLevel,
GzipCompressionLevelError,
};
use crate::array::{ArrayBytesRaw, BytesRepresentation};
use zarrs_codec::{
BytesToBytesCodecTraits, CodecError, CodecMetadataOptions, CodecOptions, CodecTraits,
PartialDecoderCapability, PartialEncoderCapability, RecommendedConcurrency,
};
use zarrs_metadata::Configuration;
use zarrs_plugin::{PluginCreateError, ZarrVersion};
#[derive(Clone, Debug)]
pub struct GzipCodec {
compression_level: GzipCompressionLevel,
}
impl GzipCodec {
pub fn new(compression_level: u32) -> Result<Self, GzipCompressionLevelError> {
let compression_level: GzipCompressionLevel = compression_level.try_into()?;
Ok(Self { compression_level })
}
pub fn new_with_configuration(
configuration: &GzipCodecConfiguration,
) -> Result<Self, PluginCreateError> {
match configuration {
GzipCodecConfiguration::V1(configuration) => Ok(Self {
compression_level: configuration.level,
}),
_ => Err(PluginCreateError::Other(
"this gzip codec configuration variant is unsupported".to_string(),
)),
}
}
}
impl CodecTraits for GzipCodec {
fn as_any(&self) -> &dyn std::any::Any {
self
}
fn configuration(
&self,
_version: ZarrVersion,
_options: &CodecMetadataOptions,
) -> Option<Configuration> {
let configuration = GzipCodecConfiguration::V1(GzipCodecConfigurationV1 {
level: self.compression_level,
});
Some(configuration.into())
}
fn partial_decoder_capability(&self) -> PartialDecoderCapability {
PartialDecoderCapability {
partial_read: false,
partial_decode: false,
}
}
fn partial_encoder_capability(&self) -> PartialEncoderCapability {
PartialEncoderCapability {
partial_encode: false,
}
}
}
#[cfg_attr(
all(feature = "async", not(target_arch = "wasm32")),
async_trait::async_trait
)]
#[cfg_attr(all(feature = "async", target_arch = "wasm32"), async_trait::async_trait(?Send))]
impl BytesToBytesCodecTraits for GzipCodec {
fn into_dyn(self: Arc<Self>) -> Arc<dyn BytesToBytesCodecTraits> {
self as Arc<dyn BytesToBytesCodecTraits>
}
fn recommended_concurrency(
&self,
_decoded_representation: &BytesRepresentation,
) -> Result<RecommendedConcurrency, CodecError> {
Ok(RecommendedConcurrency::new_maximum(1))
}
fn encode<'a>(
&self,
decoded_value: ArrayBytesRaw<'a>,
_options: &CodecOptions,
) -> Result<ArrayBytesRaw<'a>, CodecError> {
let mut encoder = GzEncoder::new(
Cursor::new(decoded_value),
flate2::Compression::new(self.compression_level.as_u32()),
);
let mut out: Vec<u8> = Vec::new();
encoder.read_to_end(&mut out)?;
Ok(Cow::Owned(out))
}
fn decode<'a>(
&self,
encoded_value: ArrayBytesRaw<'a>,
_decoded_representation: &BytesRepresentation,
_options: &CodecOptions,
) -> Result<ArrayBytesRaw<'a>, CodecError> {
let mut decoder = GzDecoder::new(Cursor::new(encoded_value));
let mut out: Vec<u8> = Vec::new();
decoder.read_to_end(&mut out)?;
Ok(Cow::Owned(out))
}
fn encoded_representation(
&self,
decoded_representation: &BytesRepresentation,
) -> BytesRepresentation {
decoded_representation
.size()
.map_or(BytesRepresentation::UnboundedSize, |size| {
const HEADER_TRAILER_OVERHEAD: u64 = 10 + 8; const BLOCK_SIZE: u64 = 32768;
const BLOCK_OVERHEAD: u64 = 5;
let blocks_overhead = BLOCK_OVERHEAD * size.div_ceil(BLOCK_SIZE);
BytesRepresentation::BoundedSize(size + HEADER_TRAILER_OVERHEAD + blocks_overhead)
})
}
}