use std::path::PathBuf;
use colored::Colorize;
use crate::{
cli::{args::sequence::SequenceFilterArgs, collect_paths, AlignSeqInput, InputCli, OutputCli},
core::sequence::filter::{SeqFilteringParameters, SequenceFiltering},
helper::logger::AlignSeqLogger,
};
// The impl bodies are empty, so the parser uses only the items these CLI
// traits already provide by default.
// NOTE(review): the `parse_input_fmt`, `parse_datatype`, `parse_output_fmt`
// and `check_output_dir_exist` calls in `filter` presumably resolve through
// these traits — which trait supplies which method is not visible here.
impl InputCli for SequenceFilterParser<'_> {}
impl OutputCli for SequenceFilterParser<'_> {}
impl AlignSeqInput for SequenceFilterParser<'_> {}
/// Command-line front end for the sequence filtering task.
///
/// Borrows the parsed arguments, works out which single filtering parameter
/// was requested, and hands the job to `SequenceFiltering`.
pub(in crate::cli) struct SequenceFilterParser<'a> {
/// Parsed command-line arguments for the filter sub-command.
args: &'a SequenceFilterArgs,
/// Input directory reported to the logger; starts as `None`.
/// NOTE(review): presumably filled in by `collect_paths!` — confirm against
/// the macro definition.
input_dir: Option<PathBuf>,
/// Filtering parameter passed to `SequenceFiltering`; starts as
/// `SeqFilteringParameters::None`.
params: SeqFilteringParameters,
/// Number of filtering options found in `args`; used to reject invocations
/// that set more than one.
counter_params: usize,
}
impl<'a> SequenceFilterParser<'a> {
    /// Creates a parser over the parsed `args` with no filtering parameter
    /// selected yet.
    pub(in crate::cli) fn new(args: &'a SequenceFilterArgs) -> Self {
        Self {
            args,
            input_dir: None,
            params: SeqFilteringParameters::None,
            counter_params: 0,
        }
    }

    /// Runs the sequence filtering command.
    ///
    /// Resolves the input format, datatype and output format from the
    /// arguments, collects the input files, logs the run summary, checks the
    /// output directory, reads the filtering option and finally delegates to
    /// `SequenceFiltering::filter`.
    ///
    /// When no filtering option is supplied, `SeqFilteringParameters::None`
    /// is passed through unchanged.
    ///
    /// Terminates the process with exit status 1 when more than one filtering
    /// option is supplied.
    pub(in crate::cli) fn filter(&mut self) {
        let input_fmt = self.parse_input_fmt(&self.args.in_fmt.input_fmt);
        let datatype = self.parse_datatype(&self.args.in_fmt.datatype);
        let output_fmt = self.parse_output_fmt(&self.args.out_fmt.output_fmt);
        let dir = &self.args.io.dir;
        let files = collect_paths!(self, dir, input_fmt);
        let task = "Filter sequences";
        AlignSeqLogger::new(
            self.input_dir.as_deref(),
            &input_fmt,
            &datatype,
            files.len(),
        )
        .log(task);
        // NOTE(review): the output directory is checked before the filtering
        // options are validated. If this check can modify the directory
        // (e.g. when `force` is set), consider validating the options first.
        self.check_output_dir_exist(&self.args.output, self.args.io.force);
        log::info!("{}", "Filtering Parameters".yellow());
        self.parse_params();
        self.check_multiple_params();
        let filter = SequenceFiltering::new(
            &files,
            &input_fmt,
            &datatype,
            &self.args.output,
            &output_fmt,
            &self.params,
        );
        filter.filter();
    }

    /// Reads the filtering options from the arguments, logging each one that
    /// is set and counting how many were supplied.
    ///
    /// Options are inspected in the order minimum length, maximum gap,
    /// maximum length; a later option overwrites `self.params`, which is why
    /// `check_multiple_params` must run afterwards to reject conflicts.
    fn parse_params(&mut self) {
        // Start from a clean state so that calling `filter` again on the same
        // parser does not accumulate counts from a previous run.
        self.params = SeqFilteringParameters::None;
        self.counter_params = 0;

        if let Some(min_len) = self.args.min_len {
            log::info!("{:18}: {}\n", "Minimum length", min_len);
            self.params = SeqFilteringParameters::MinSequenceLength(min_len);
            self.counter_params += 1;
        }
        if let Some(max_gap) = self.args.max_gap {
            // The value is scaled by 100 so the log shows a percentage.
            log::info!("{:18}: {}%\n", "Max gaps", max_gap * 100.0);
            self.params = SeqFilteringParameters::PercentMaxGap(max_gap);
            self.counter_params += 1;
        }
        if let Some(max_len) = self.args.max_len {
            log::info!("{:18}: {}\n", "Maximum length", max_len);
            self.params = SeqFilteringParameters::MaxSequenceLength(max_len);
            self.counter_params += 1;
        }
    }

    /// Aborts the run when more than one filtering option was supplied.
    ///
    /// Logs a warning and terminates the process with exit status 1.
    fn check_multiple_params(&self) {
        if self.counter_params > 1 {
            log::warn!("Multiple parameters are set. Only one parameter is allowed at a time!");
            // Conflicting options are a usage error: exit with a non-zero
            // status so shells and pipelines can detect that nothing ran.
            std::process::exit(1);
        }
    }
}