use std::borrow::Cow;
use crate::base::write::get_or_put_info_zip_unicode_comment_extra_field_mut;
use crate::base::write::get_or_put_info_zip_unicode_path_extra_field_mut;
use crate::base::write::{CentralDirectoryEntry, ZipFileWriter};
use crate::entry::ZipEntry;
use crate::error::{Result, Zip64ErrorCase, ZipError};
use crate::spec::extra_field::Zip64ExtendedInformationExtraFieldBuilder;
use crate::spec::header::{InfoZipUnicodeCommentExtraField, InfoZipUnicodePathExtraField};
use crate::spec::{
extra_field::ExtraFieldAsBytes,
header::{CentralDirectoryRecord, ExtraField, GeneralPurposeFlag, LocalFileHeader},
Compression,
};
use crate::StringEncoding;
#[cfg(any(feature = "deflate", feature = "bzip2", feature = "zstd", feature = "lzma", feature = "xz"))]
use futures_lite::io::Cursor;
use crate::spec::consts::{NON_ZIP64_MAX_NUM_FILES, NON_ZIP64_MAX_SIZE};
#[cfg(any(feature = "deflate", feature = "bzip2", feature = "zstd", feature = "lzma", feature = "xz"))]
use async_compression::futures::write;
use futures_lite::io::{AsyncWrite, AsyncWriteExt};
pub struct EntryWholeWriter<'b, 'c, W: AsyncWrite + Unpin> {
writer: &'b mut ZipFileWriter<W>,
entry: ZipEntry,
data: Cow<'c, [u8]>,
builder: Option<Zip64ExtendedInformationExtraFieldBuilder>,
lh_offset: u64,
precompressed: bool,
}
impl<'b, 'c, W: AsyncWrite + Unpin> EntryWholeWriter<'b, 'c, W> {
pub fn from_raw(writer: &'b mut ZipFileWriter<W>, entry: ZipEntry, data: &'c [u8]) -> Self {
Self { writer, entry, data: Cow::Borrowed(data), builder: None, lh_offset: 0, precompressed: false }
}
pub fn from_precompressed(writer: &'b mut ZipFileWriter<W>, entry: ZipEntry, data: &'c [u8]) -> Self {
Self { writer, entry, data: Cow::Borrowed(data), builder: None, lh_offset: 0, precompressed: true }
}
async fn compress(&mut self) {
if self.entry.compression() == Compression::Stored {
return;
}
#[cfg(any(
feature = "deflate",
feature = "bzip2",
feature = "zstd",
feature = "lzma",
feature = "xz",
feature = "deflate64"
))]
{
let new_data = compress(&self.entry, &self.data).await;
self.data = Cow::Owned(new_data);
}
}
fn enforce_zip64_sizes(&mut self) -> Result<()> {
let uncompressed_larger = self.entry.uncompressed_size > NON_ZIP64_MAX_SIZE.into();
let compressed_larger = self.entry.compressed_size > NON_ZIP64_MAX_SIZE.into();
if !uncompressed_larger && !compressed_larger {
return Ok(());
}
self.enforce_zip64()?;
let builder = Zip64ExtendedInformationExtraFieldBuilder::new();
let builder = builder.sizes(self.entry.compressed_size(), self.entry.uncompressed_size());
self.builder = Some(builder);
self.entry.uncompressed_size = NON_ZIP64_MAX_SIZE.into();
self.entry.compressed_size = NON_ZIP64_MAX_SIZE.into();
Ok(())
}
fn enforce_zip64_offset(&mut self) -> Result<()> {
if self.lh_offset <= NON_ZIP64_MAX_SIZE.into() {
return Ok(());
}
self.enforce_zip64()?;
let builder = self.builder.take().unwrap_or(Zip64ExtendedInformationExtraFieldBuilder::new());
let builder = builder.relative_header_offset(self.lh_offset);
self.builder = Some(builder);
self.lh_offset = NON_ZIP64_MAX_SIZE.into();
Ok(())
}
fn enforce_zip64(&mut self) -> Result<()> {
if self.writer.force_no_zip64 {
return Err(ZipError::Zip64Needed(Zip64ErrorCase::LargeFile));
}
if !self.writer.is_zip64 {
self.writer.is_zip64 = true;
}
Ok(())
}
fn utf8_without_alternative(&mut self) -> bool {
let utf8_without_alternative =
self.entry.filename().is_utf8_without_alternative() && self.entry.comment().is_utf8_without_alternative();
if !utf8_without_alternative {
if matches!(self.entry.filename().encoding(), StringEncoding::Utf8) {
let u_file_name = self.entry.filename().as_bytes().to_vec();
if !u_file_name.is_empty() {
let basic_crc32 = crc32fast::hash(
self.entry.filename().alternative().unwrap_or_else(|| self.entry.filename().as_bytes()),
);
let upath_field =
get_or_put_info_zip_unicode_path_extra_field_mut(self.entry.extra_fields.as_mut());
if let InfoZipUnicodePathExtraField::V1 { crc32, unicode } = upath_field {
*crc32 = basic_crc32;
*unicode = u_file_name;
}
}
}
if matches!(self.entry.comment().encoding(), StringEncoding::Utf8) {
let u_comment = self.entry.comment().as_bytes().to_vec();
if !u_comment.is_empty() {
let basic_crc32 = crc32fast::hash(
self.entry.comment().alternative().unwrap_or_else(|| self.entry.comment().as_bytes()),
);
let ucom_field =
get_or_put_info_zip_unicode_comment_extra_field_mut(self.entry.extra_fields.as_mut());
if let InfoZipUnicodeCommentExtraField::V1 { crc32, unicode } = ucom_field {
*crc32 = basic_crc32;
*unicode = u_comment;
}
}
}
}
utf8_without_alternative
}
pub async fn write(mut self) -> Result<()> {
if !self.precompressed {
self.entry.uncompressed_size = self.data.len() as u64;
self.entry.crc32 = crc32fast::hash(&self.data);
self.compress().await;
}
self.entry.compressed_size = self.data.len() as u64;
self.enforce_zip64_sizes()?;
self.lh_offset = self.writer.writer.offset();
self.enforce_zip64_offset()?;
if let Some(builder) = self.builder {
if !builder.eof_only() {
self.entry.extra_fields.push(ExtraField::Zip64ExtendedInformation(builder.build()?));
self.builder = None;
} else {
self.builder = Some(builder);
}
}
let utf8_without_alternative = self.utf8_without_alternative();
let filename_basic = self.entry.filename().alternative().unwrap_or_else(|| self.entry.filename().as_bytes());
let comment_basic = self.entry.comment().alternative().unwrap_or_else(|| self.entry.comment().as_bytes());
let lf_header = LocalFileHeader {
compressed_size: self.entry.compressed_size() as u32,
uncompressed_size: self.entry.uncompressed_size() as u32,
compression: self.entry.compression().into(),
crc: self.entry.crc32(),
extra_field_length: self
.entry
.extra_fields()
.count_bytes()
.try_into()
.map_err(|_| ZipError::ExtraFieldTooLarge)?,
file_name_length: filename_basic.len().try_into().map_err(|_| ZipError::FileNameTooLarge)?,
mod_time: self.entry.last_modification_date().time,
mod_date: self.entry.last_modification_date().date,
version: crate::spec::version::as_needed_to_extract(&self.entry),
flags: GeneralPurposeFlag {
data_descriptor: false,
encrypted: false,
filename_unicode: utf8_without_alternative,
},
};
let mut header = CentralDirectoryRecord {
v_made_by: crate::spec::version::as_made_by(),
v_needed: lf_header.version,
compressed_size: lf_header.compressed_size,
uncompressed_size: lf_header.uncompressed_size,
compression: lf_header.compression,
crc: lf_header.crc,
extra_field_length: lf_header.extra_field_length,
file_name_length: lf_header.file_name_length,
file_comment_length: comment_basic.len().try_into().map_err(|_| ZipError::CommentTooLarge)?,
mod_time: lf_header.mod_time,
mod_date: lf_header.mod_date,
flags: lf_header.flags,
disk_start: 0,
inter_attr: self.entry.internal_file_attribute(),
exter_attr: self.entry.external_file_attribute(),
lh_offset: self.lh_offset as u32,
};
self.writer.writer.write_all(&crate::spec::consts::LFH_SIGNATURE.to_le_bytes()).await?;
self.writer.writer.write_all(&lf_header.as_slice()).await?;
self.writer.writer.write_all(filename_basic).await?;
self.writer.writer.write_all(&self.entry.extra_fields().as_bytes()).await?;
self.writer.writer.write_all(&self.data).await?;
if let Some(builder1) = self.builder {
self.entry.extra_fields.push(ExtraField::Zip64ExtendedInformation(builder1.build()?));
header.extra_field_length =
self.entry.extra_fields().count_bytes().try_into().map_err(|_| ZipError::ExtraFieldTooLarge)?;
}
self.writer.cd_entries.push(CentralDirectoryEntry { header, entry: self.entry });
if self.writer.cd_entries.len() > NON_ZIP64_MAX_NUM_FILES as usize {
if self.writer.force_no_zip64 {
return Err(ZipError::Zip64Needed(Zip64ErrorCase::TooManyFiles));
}
if !self.writer.is_zip64 {
self.writer.is_zip64 = true;
}
}
Ok(())
}
}
#[cfg(any(
feature = "deflate",
feature = "bzip2",
feature = "zstd",
feature = "lzma",
feature = "xz",
feature = "deflate64"
))]
pub async fn compress(entry: &ZipEntry, data: &[u8]) -> Vec<u8> {
let level = entry.compression_level;
match entry.compression() {
#[cfg(feature = "deflate")]
Compression::Deflate => {
let mut writer = write::DeflateEncoder::with_quality(Cursor::new(Vec::new()), level);
writer.write_all(data).await.unwrap();
writer.close().await.unwrap();
writer.into_inner().into_inner()
}
#[cfg(feature = "deflate64")]
Compression::Deflate64 => panic!("compressing deflate64 is not supported"),
#[cfg(feature = "bzip2")]
Compression::Bz => {
let mut writer = write::BzEncoder::with_quality(Cursor::new(Vec::new()), level);
writer.write_all(data).await.unwrap();
writer.close().await.unwrap();
writer.into_inner().into_inner()
}
#[cfg(feature = "lzma")]
Compression::Lzma => {
let mut writer = write::LzmaEncoder::with_quality(Cursor::new(Vec::new()), level);
writer.write_all(data).await.unwrap();
writer.close().await.unwrap();
writer.into_inner().into_inner()
}
#[cfg(feature = "xz")]
Compression::Xz => {
let mut writer = write::XzEncoder::with_quality(Cursor::new(Vec::new()), level);
writer.write_all(data).await.unwrap();
writer.close().await.unwrap();
writer.into_inner().into_inner()
}
#[cfg(feature = "zstd")]
Compression::Zstd => {
let mut writer = write::ZstdEncoder::with_quality(Cursor::new(Vec::new()), level);
writer.write_all(data).await.unwrap();
writer.close().await.unwrap();
writer.into_inner().into_inner()
}
_ => unreachable!(),
}
}
pub fn crc32(data: &[u8]) -> u32 {
crc32fast::hash(data)
}