use std::{fmt, path::Path};
use CompressionFormat::*;
use bstr::ByteSlice;
use crate::{
error::{Error, FinalError, Result},
utils::PathFmt,
warning,
};
/// Every plain (non-alias) extension this module recognises.
///
/// Used for membership checks against raw path segments, so it must stay in
/// sync with the extensions accepted by `slice_to_extension`. `"bz3"` is
/// listed because the parser accepts it; leaving it out makes the lookups
/// in this file miss `.bz3` files.
pub const SUPPORTED_EXTENSIONS: &[&str] = &[
    "tar",
    "zip",
    "bz",
    "bz2",
    "bz3",
    "gz",
    "lz4",
    "xz",
    "lzma",
    "lz",
    "sz",
    "zst",
    // Only listed when the crate is built with the `unrar` feature.
    #[cfg(feature = "unrar")]
    "rar",
    "7z",
    "br",
];
/// Short-hand extensions recognised by this module, such as `tgz`.
///
/// Each entry must be spelled exactly as the parser matches it; the LZMA
/// tarball alias is `tlzma` (it was previously misspelled `tzlma`, so it was
/// never found by lookups in this list).
pub const SUPPORTED_ALIASES: &[&str] = &[
    "tgz", "tbz", "tlz4", "txz", "tlzma", "tsz", "tzst", "tlz", "cbt", "cbz", "cb7", "cbr",
];
/// Human-readable, comma-separated list of the supported extensions
/// (build without the `unrar` feature, so `rar` is not listed).
///
/// Includes `br`, which is a supported extension but was missing here.
#[cfg(not(feature = "unrar"))]
pub const PRETTY_SUPPORTED_EXTENSIONS: &str = "tar, zip, bz, bz2, bz3, gz, lz4, xz, lzma, lz, sz, zst, 7z, br";
/// Human-readable, comma-separated list of the supported extensions
/// (build with the `unrar` feature, so `rar` is listed).
///
/// Includes `br`, which is a supported extension but was missing here.
#[cfg(feature = "unrar")]
pub const PRETTY_SUPPORTED_EXTENSIONS: &str = "tar, zip, bz, bz2, bz3, gz, lz4, xz, lzma, lz, sz, zst, rar, 7z, br";
/// Human-readable, comma-separated list of the supported extension aliases.
pub const PRETTY_SUPPORTED_ALIASES: &str = "tgz, tbz, tlz4, txz, tlzma, tsz, tzst, tlz, cbt, cbz, cb7, cbr";
/// A single recognised file extension together with the compression
/// format(s) it stands for.
#[derive(Debug, Clone)]
#[cfg_attr(test, derive(PartialEq))]
#[non_exhaustive]
pub struct Extension {
/// Formats denoted by this extension, in order. A plain extension holds one
/// format; an alias may hold several.
pub compression_formats: Vec<CompressionFormat>,
/// Text written out by the `Display` implementation.
display_text: String,
}
impl Extension {
    /// Creates an extension from a list of formats and the text used to
    /// display it.
    ///
    /// # Panics
    ///
    /// Panics if `formats` converts into an empty list.
    pub fn new(formats: impl Into<Vec<CompressionFormat>>, text: impl ToString) -> Self {
        let compression_formats: Vec<CompressionFormat> = formats.into();
        assert!(!compression_formats.is_empty());

        let display_text = text.to_string();
        Self {
            compression_formats,
            display_text,
        }
    }

    /// Creates a single-format extension whose display text is the format's
    /// own extension string.
    pub fn from_format(format: CompressionFormat) -> Self {
        let display_text = String::from(format.as_str());
        Self {
            compression_formats: Vec::from([format]),
            display_text,
        }
    }

    /// Reports whether the first format of this extension is an archive
    /// format.
    ///
    /// # Panics
    ///
    /// Panics if `compression_formats` is empty.
    pub fn is_archive(&self) -> bool {
        let leading_format = &self.compression_formats[0];
        leading_format.is_archive_format()
    }
}
impl fmt::Display for Extension {
    /// Writes the stored display text, honouring any formatter flags.
    fn fmt(&self, f: &mut fmt::Formatter) -> fmt::Result {
        fmt::Display::fmt(&self.display_text, f)
    }
}
/// Every compression or archive format this module can name.
#[derive(Copy, Clone, PartialEq, Eq, Debug)]
pub enum CompressionFormat {
/// `.gz`
Gzip,
/// `.bz` and `.bz2`
Bzip,
/// `.bz3`
Bzip3,
/// `.lz4`
Lz4,
/// `.xz`
Xz,
/// `.lzma`
Lzma,
/// `.lz`
Lzip,
/// `.sz`
Snappy,
/// `.tar` (archive format)
Tar,
/// `.zst`
Zstd,
/// `.zip` (archive format)
Zip,
/// `.rar` (archive format)
Rar,
/// `.7z` (archive format)
SevenZip,
/// `.br`
Brotli,
}
impl CompressionFormat {
pub fn is_archive_format(&self) -> bool {
match self {
Tar | Zip | Rar | SevenZip => true,
Bzip | Bzip3 | Lz4 | Lzma | Xz | Lzip | Snappy | Zstd | Brotli | Gzip => false,
}
}
pub fn as_str(&self) -> &str {
match self {
Tar => "tar",
Zip => "zip",
Rar => "rar",
SevenZip => "7z",
Brotli => "br",
Gzip => "gz",
Bzip => "bz",
Bzip3 => "bz3",
Lz4 => "lz4",
Xz => "xz",
Lzma => "lzma",
Lzip => "lz",
Snappy => "sz",
Zstd => "zst",
}
}
}
/// Maps a raw extension (no leading dot) to the [`Extension`] it denotes.
///
/// Matching is exact and case-sensitive. Returns `None` when `ext` is not
/// one of the known extensions or aliases.
fn slice_to_extension(ext: &[u8]) -> Option<Extension> {
    let formats: &[CompressionFormat] = match ext {
        // Archive formats and their single-format aliases.
        b"tar" | b"cbt" => &[Tar],
        b"zip" | b"cbz" => &[Zip],
        b"rar" | b"cbr" => &[Rar],
        b"7z" | b"cb7" => &[SevenZip],

        // Stream compressors.
        b"gz" => &[Gzip],
        b"bz" | b"bz2" => &[Bzip],
        b"bz3" => &[Bzip3],
        b"lz4" => &[Lz4],
        b"xz" => &[Xz],
        b"lzma" => &[Lzma],
        b"lz" => &[Lzip],
        b"sz" => &[Snappy],
        b"zst" => &[Zstd],
        b"br" => &[Brotli],

        // Aliases that expand to tar plus one compressor.
        b"tgz" => &[Tar, Gzip],
        b"tbz" | b"tbz2" => &[Tar, Bzip],
        b"tbz3" => &[Tar, Bzip3],
        b"tlz4" => &[Tar, Lz4],
        b"txz" => &[Tar, Xz],
        b"tlzma" => &[Tar, Lzma],
        b"tlz" => &[Tar, Lzip],
        b"tsz" => &[Tar, Snappy],
        b"tzst" => &[Tar, Zstd],

        _ => return None,
    };

    // The display text is the extension exactly as it was written.
    Some(Extension::new(formats, ext.to_str_lossy()))
}
/// Splits the last known extension off `name`.
///
/// Returns the part before the final `.` together with the parsed
/// extension, or `None` when there is no `.`, when the part before it is
/// empty, `.` or `..`, or when the suffix is not a known extension.
fn split_extension_at_end(name: &[u8]) -> Option<(&[u8], Extension)> {
    let (stem, suffix) = name.rsplit_once_str(b".")?;

    match stem {
        // Nothing meaningful precedes the dot, so this is not an extension.
        b"" | b"." | b".." => None,
        _ => slice_to_extension(suffix).map(|extension| (stem, extension)),
    }
}
/// Parses a dot-separated format string such as `tar.gz` into extensions.
///
/// Empty segments (leading, trailing or repeated dots) are ignored.
///
/// # Errors
///
/// Returns `Error::InvalidFormatFlag` when a segment is not a known
/// extension, or when no extension remains after dropping empty segments.
pub fn parse_format_flag(text: &str) -> Result<Vec<Extension>> {
    let mut extensions = Vec::new();

    for extension in text.split('.') {
        if extension.is_empty() {
            continue;
        }

        let Some(parsed) = slice_to_extension(extension.as_bytes()) else {
            return Err(Error::InvalidFormatFlag {
                text: text.to_owned(),
                reason: format!("Unsupported extension '{extension}'"),
            });
        };
        extensions.push(parsed);
    }

    if extensions.is_empty() {
        return Err(Error::InvalidFormatFlag {
            text: text.to_owned(),
            reason: "Parsing got an empty list of extensions.".to_string(),
        });
    }

    Ok(extensions)
}
/// Strips every known extension from the end of `path`'s file name.
///
/// Returns the remaining file name (only the final component, not the
/// parent directories) and the extensions in left-to-right order. If the
/// file name is missing or cannot be viewed as bytes, `path` is returned
/// unchanged with no extensions. Stripping stops at the first archive
/// extension found when walking from the right.
///
/// Emits a warning when the remaining name, with surrounding dots trimmed,
/// is itself a supported extension or alias.
///
/// # Errors
///
/// Fails when an archive extension is preceded by another known extension
/// (for example `file.tar.zip`), since an archive extension must come first.
pub fn separate_known_extensions_from_name(path: &Path) -> Result<(&Path, Vec<Extension>)> {
    let mut extensions = vec![];

    let Some(mut name) = path.file_name().and_then(<[u8] as ByteSlice>::from_os_str) else {
        return Ok((path, extensions));
    };

    loop {
        let Some((remaining, extension)) = split_extension_at_end(name) else {
            break;
        };
        name = remaining;

        let found_archive = extension.is_archive();
        extensions.insert(0, extension);
        if !found_archive {
            continue;
        }

        // An archive extension must be the left-most one: anything known that
        // still precedes it is misplaced.
        let Some((_, misplaced_extension)) = split_extension_at_end(name) else {
            break;
        };
        let archive_extension = &extensions[0];

        let mut error = FinalError::with_title("File extensions are invalid for operation").detail(format!(
            "The archive extension '.{}' can only be placed at the start of the extension list",
            archive_extension.display_text,
        ));

        if misplaced_extension.compression_formats == archive_extension.compression_formats {
            error = error.detail(format!(
                "File: {} contains '.{}' and '.{}'",
                PathFmt(path),
                misplaced_extension.display_text,
                archive_extension.display_text,
            ));
        }

        let error = error
            .hint("You can use `--format` to specify what format to use, examples:")
            .hint(" ouch compress file.zip.zip file --format zip")
            .hint(" ouch decompress file --format zst")
            .hint(" ouch list archive --format tar.gz");
        return Err(error.into());
    }

    if let Ok(remaining_text) = name.to_str() {
        let file_stem = remaining_text.trim_matches('.');
        let stem_is_extension = SUPPORTED_EXTENSIONS.contains(&file_stem) || SUPPORTED_ALIASES.contains(&file_stem);
        if stem_is_extension {
            warning!("Received a file with name '{file_stem}', but {file_stem} was expected as the extension");
        }
    }

    Ok((name.to_path().unwrap(), extensions))
}
/// Returns only the known extensions found at the end of `path`'s file name.
///
/// # Errors
///
/// Propagates any error from [`separate_known_extensions_from_name`].
pub fn extensions_from_path(path: &Path) -> Result<Vec<Extension>> {
    let (_, extensions) = separate_known_extensions_from_name(path)?;
    Ok(extensions)
}
/// Flattens `formats` and splits the result into its first format and the
/// remaining ones.
///
/// # Panics
///
/// Panics if the flattened list is empty.
pub fn split_first_compression_format(formats: &[Extension]) -> (CompressionFormat, Vec<CompressionFormat>) {
    let mut remaining = flatten_compression_formats(formats);
    let leading = remaining.remove(0);
    (leading, remaining)
}
/// Concatenates the formats of every extension, preserving order.
pub fn flatten_compression_formats(extensions: &[Extension]) -> Vec<CompressionFormat> {
    let mut flattened = Vec::new();
    for extension in extensions {
        flattened.extend_from_slice(&extension.compression_formats);
    }
    flattened
}
/// Builds a suggested path by inserting `suggested_extension` right before
/// the first known extension of `path`'s file name.
///
/// `suggested_extension` is inserted verbatim, so it should carry its own
/// leading dot (for example `".tar"`). Returns `None` when the file name has
/// no segment listed in `SUPPORTED_EXTENSIONS` or `SUPPORTED_ALIASES`.
///
/// Only the final path component is inspected. Dots in parent directories
/// (such as `backups.tar.d/`) are not extensions of the file and must not
/// attract the insertion.
pub fn build_archive_file_suggestion(path: &Path, suggested_extension: &str) -> Option<String> {
    let path = path.to_string_lossy();

    // Start scanning after the last path separator. Separators are
    // single-byte ASCII, so `idx + 1` is always a valid char boundary.
    let file_name_start = path.rfind(std::path::is_separator).map_or(0, |idx| idx + 1);

    let mut rest = &path[file_name_start..];
    // Byte offset into `path` of the start of `rest`.
    let mut position_to_insert = file_name_start;

    while let Some(pos) = rest.find('.') {
        // Step past the dot; `rest` now starts at a candidate extension.
        rest = &rest[pos + 1..];
        position_to_insert += pos + 1;

        // The candidate runs up to the next dot, or to the end of the name.
        let maybe_extension = rest.split_once('.').map_or(rest, |(head, _)| head);

        if SUPPORTED_EXTENSIONS.contains(&maybe_extension) || SUPPORTED_ALIASES.contains(&maybe_extension) {
            let mut suggestion = path.to_string();
            // Insert before the dot that introduces the matched extension.
            suggestion.insert_str(position_to_insert - 1, suggested_extension);
            return Some(suggestion);
        }
    }

    None
}
// Unit tests for extension parsing, format-flag parsing and suggestion building.
#[cfg(test)]
mod tests {
use super::*;
// A two-extension file name flattens to its formats in left-to-right order.
#[test]
fn test_extensions_from_path() {
let path = Path::new("bolovo.tar.gz");
let extensions = extensions_from_path(path).unwrap();
let formats = flatten_compression_formats(&extensions);
assert_eq!(formats, vec![Tar, Gzip]);
}
// Checks the (remaining name, extensions) pair for plain names, names that
// are themselves an extension, dot-files and multi-extension names.
#[test]
fn test_separate_known_extensions_from_name() {
assert_eq!(
separate_known_extensions_from_name("file".as_ref()).unwrap(),
("file".as_ref(), vec![])
);
// A bare "tar" has no dot, so nothing is split off.
assert_eq!(
separate_known_extensions_from_name("tar".as_ref()).unwrap(),
("tar".as_ref(), vec![])
);
// Nothing precedes the dot in ".tar", so "tar" is not treated as an extension.
assert_eq!(
separate_known_extensions_from_name(".tar".as_ref()).unwrap(),
(".tar".as_ref(), vec![])
);
assert_eq!(
separate_known_extensions_from_name("file.tar".as_ref()).unwrap(),
("file".as_ref(), vec![Extension::new([Tar], "tar")])
);
assert_eq!(
separate_known_extensions_from_name("file.tar.gz".as_ref()).unwrap(),
(
"file".as_ref(),
vec![Extension::new([Tar], "tar"), Extension::new([Gzip], "gz")]
)
);
// Only "gz" is stripped; the leading ".tar" stays as the file name.
assert_eq!(
separate_known_extensions_from_name(".tar.gz".as_ref()).unwrap(),
(".tar".as_ref(), vec![Extension::new([Gzip], "gz")])
);
}
// Format flags tolerate leading, trailing and repeated dots, and reject
// unknown segments.
#[test]
fn test_parse_of_format_flag() {
assert_eq!(parse_format_flag("tar").unwrap(), vec![Extension::new([Tar], "tar")]);
assert_eq!(parse_format_flag(".tar").unwrap(), vec![Extension::new([Tar], "tar")]);
assert_eq!(
parse_format_flag("tar.gz").unwrap(),
vec![Extension::new([Tar], "tar"), Extension::new([Gzip], "gz")]
);
assert_eq!(
parse_format_flag(".tar.gz").unwrap(),
vec![Extension::new([Tar], "tar"), Extension::new([Gzip], "gz")]
);
assert_eq!(
parse_format_flag("..tar..gz.....").unwrap(),
vec![Extension::new([Tar], "tar"), Extension::new([Gzip], "gz")]
);
assert!(parse_format_flag("../tar.gz").is_err());
assert!(parse_format_flag("targz").is_err());
assert!(parse_format_flag("tar.gz.unknown").is_err());
assert!(parse_format_flag(".tar.gz.unknown").is_err());
assert!(parse_format_flag(".tar.!@#.gz").is_err());
}
// The suggested extension goes right before the first known extension;
// unknown segments such as "pkg" and "info" are skipped over.
#[test]
fn builds_suggestion_correctly() {
assert_eq!(build_archive_file_suggestion(Path::new("linux.png"), ".tar"), None);
assert_eq!(
build_archive_file_suggestion(Path::new("linux.xz.gz.zst"), ".tar").unwrap(),
"linux.tar.xz.gz.zst"
);
assert_eq!(
build_archive_file_suggestion(Path::new("linux.pkg.xz.gz.zst"), ".tar").unwrap(),
"linux.pkg.tar.xz.gz.zst"
);
assert_eq!(
build_archive_file_suggestion(Path::new("linux.pkg.zst"), ".tar").unwrap(),
"linux.pkg.tar.zst"
);
assert_eq!(
build_archive_file_suggestion(Path::new("linux.pkg.info.zst"), ".tar").unwrap(),
"linux.pkg.info.tar.zst"
);
}
// An archive extension that is not the left-most known extension is an error.
#[test]
fn test_extension_parsing_with_multiple_archive_formats() {
assert!(separate_known_extensions_from_name("file.tar.zip".as_ref()).is_err());
assert!(separate_known_extensions_from_name("file.7z.zst.zip.lz4".as_ref()).is_err());
}
}