use std::fs::File;
use std::io::{BufReader, BufWriter, Write};
use std::path::PathBuf;
use clap::Parser;
use rsomics_common::{CommonFlags, Result, RsomicsError, Tool, ToolMeta};
use rsomics_help::{Example, FlagSpec, HelpSpec, Origin, Section};
use rsomics_anosim::run;
pub const META: ToolMeta = ToolMeta {
name: env!("CARGO_PKG_NAME"),
version: env!("CARGO_PKG_VERSION"),
};
#[derive(Parser, Debug)]
#[command(name = "rsomics-anosim", version, about, long_about = None, disable_help_flag = true)]
pub struct Cli {
#[arg(default_value = "-")]
input: PathBuf,
#[arg(long)]
grouping: PathBuf,
#[arg(long, default_value_t = 999)]
permutations: usize,
#[arg(long, default_value_t = false)]
csv: bool,
#[arg(short = 'o', long, default_value = "-")]
output: String,
#[command(flatten)]
pub common: CommonFlags,
}
impl Tool for Cli {
fn meta() -> ToolMeta {
META
}
fn common(&self) -> &CommonFlags {
&self.common
}
fn execute(self) -> Result<()> {
self.common.install_rayon_pool()?;
let delim = if self.csv { ',' } else { '\t' };
let dm_reader: Box<dyn std::io::BufRead> = if self.input.as_os_str() == "-" {
Box::new(BufReader::new(std::io::stdin().lock()))
} else {
Box::new(BufReader::new(File::open(&self.input).map_err(|e| {
RsomicsError::InvalidInput(format!("{}: {e}", self.input.display()))
})?))
};
let grouping_reader = BufReader::new(File::open(&self.grouping).map_err(|e| {
RsomicsError::InvalidInput(format!("{}: {e}", self.grouping.display()))
})?);
let mut out: Box<dyn Write> = if self.output == "-" {
Box::new(BufWriter::new(std::io::stdout().lock()))
} else {
Box::new(BufWriter::new(
File::create(&self.output).map_err(RsomicsError::Io)?,
))
};
let seed = self.common.seed.unwrap_or(0);
run(
dm_reader,
grouping_reader,
&mut out,
delim,
self.permutations,
seed,
)?;
out.flush().map_err(RsomicsError::Io)
}
}
pub static HELP: HelpSpec = HelpSpec {
name: env!("CARGO_PKG_NAME"),
version: env!("CARGO_PKG_VERSION"),
tagline: "ANOSIM test for group differences from a distance matrix.",
origin: Some(Origin {
upstream: "scikit-bio skbio.stats.distance.anosim",
upstream_license: "BSD-3-Clause",
our_license: "MIT OR Apache-2.0",
paper_doi: Some("10.1111/j.1442-9993.1993.tb00438.x"),
}),
usage_lines: &[
"[distance_matrix.tsv] --grouping groups.tsv [--permutations 999] [-o result.tsv]",
],
sections: &[Section {
title: "OPTIONS",
flags: &[
FlagSpec {
short: None,
long: "grouping",
aliases: &[],
value: Some("<path>"),
type_hint: None,
required: true,
default: None,
description: "Grouping TSV (id<TAB>group per sample).",
why_default: None,
},
FlagSpec {
short: None,
long: "permutations",
aliases: &[],
value: Some("<n>"),
type_hint: Some("usize"),
required: false,
default: Some("999"),
description: "Permutations for the p-value (0 skips it).",
why_default: None,
},
FlagSpec {
short: None,
long: "csv",
aliases: &[],
value: None,
type_hint: None,
required: false,
default: Some("false"),
description: "Parse the distance matrix as comma-separated.",
why_default: None,
},
FlagSpec {
short: Some('o'),
long: "output",
aliases: &[],
value: Some("<path>"),
type_hint: Some("String"),
required: false,
default: Some("-"),
description: "Output path (- for stdout).",
why_default: None,
},
],
}],
examples: &[
Example {
description: "ANOSIM with 999 permutations",
command: "rsomics-anosim dm.tsv --grouping groups.tsv",
},
Example {
description: "Pipe a Bray-Curtis matrix from rsomics-beta-diversity",
command: "rsomics-beta-diversity counts.tsv | rsomics-anosim --grouping groups.tsv",
},
],
json_result_schema_doc: None,
};
#[cfg(test)]
mod tests {
use super::*;
use clap::CommandFactory;
#[test]
fn cli_debug_assert() {
Cli::command().debug_assert();
}
}