pub mod index;
pub mod iterators;
mod array;
mod slice;
pub use array::SeqArray;
pub use slice::SeqSlice;
use crate::codec::{text, Codec};
use crate::error::ParseBioError;
use crate::{Bs, Bv, Order};
use bitvec::field::BitField;
use bitvec::view::BitView;
#[cfg(feature = "serde")]
use serde::{Deserialize, Serialize};
use core::borrow::Borrow;
use core::fmt;
use core::marker::PhantomData;
use core::ops::Deref;
use core::ptr;
use core::str;
use core::str::FromStr;
#[derive(Debug, Eq, PartialEq, PartialOrd, Ord, Hash)]
#[cfg_attr(feature = "serde", derive(Serialize, Deserialize))]
#[repr(transparent)]
pub struct Seq<A: Codec> {
pub(crate) _p: PhantomData<A>,
pub(crate) bv: Bv,
}
impl<A: Codec> From<Seq<A>> for usize {
fn from(slice: Seq<A>) -> usize {
assert!(slice.bv.len() <= usize::BITS as usize);
slice.bv.load_le::<usize>() }
}
pub trait ReverseComplement {
type Output;
fn revcomp(&self) -> Self::Output;
}
impl<A: Codec> Default for Seq<A> {
fn default() -> Self {
Self::new()
}
}
impl<A: Codec> Seq<A> {
pub fn new() -> Self {
Seq {
_p: PhantomData,
bv: Bv::new(),
}
}
pub fn trim_u8(v: &[u8]) -> Result<Self, ParseBioError> {
let start = v
.iter()
.position(|&byte| A::try_from_ascii(byte).is_some())
.unwrap_or(v.len());
let end = v[start..]
.iter()
.rposition(|&byte| A::try_from_ascii(byte).is_some())
.map_or(start, |pos| start + pos + 1);
v[start..end]
.iter()
.map(|&byte| A::try_from_ascii(byte).ok_or(ParseBioError::UnrecognisedBase(byte)))
.collect()
}
pub fn with_capacity(len: usize) -> Self {
Seq {
_p: PhantomData,
bv: Bv::with_capacity(len * A::BITS as usize),
}
}
pub fn nth(&self, i: usize) -> A {
A::unsafe_from_bits(self[i].into())
}
pub fn get(&self, i: usize) -> Option<A> {
if i >= self.bv.len() / A::BITS as usize {
None
} else {
Some(A::unsafe_from_bits(self[i].into()))
}
}
pub fn len(&self) -> usize {
self.bv.len() / A::BITS as usize
}
pub fn is_empty(&self) -> bool {
self.len() == 0
}
pub fn bit_and(self, rhs: Seq<A>) -> Seq<A> {
Seq::<A> {
_p: PhantomData,
bv: Bv::from_bitslice(&(self.bv & rhs.bv)),
}
}
pub fn bit_or(self, rhs: Seq<A>) -> Seq<A> {
Seq::<A> {
_p: PhantomData,
bv: Bv::from_bitslice(&(self.bv | rhs.bv)),
}
}
pub fn push(&mut self, item: A) {
let byte: u8 = item.to_bits();
self.bv
.extend_from_bitslice(&byte.view_bits::<Order>()[..A::BITS as usize]);
}
pub fn clear(&mut self) {
self.bv.clear();
}
pub fn pop(&mut self) -> Option<A> {
unimplemented!()
}
pub fn truncate(&mut self, _len: usize) {
unimplemented!()
}
pub fn remove(&mut self, _index: usize) -> A {
unimplemented!()
}
pub fn insert(&mut self, _index: usize, _element: A) {
unimplemented!()
}
pub fn extend<I: IntoIterator<Item = A>>(&mut self, iter: I) {
iter.into_iter().for_each(|base| self.push(base));
}
pub fn from_raw(len: usize, bits: &[usize]) -> Self {
let mut bv: Bv = Bv::from_slice(bits);
bv.truncate(len * A::BITS as usize);
Seq {
_p: PhantomData,
bv,
}
}
pub fn into_raw(&self) -> &[usize] {
self.bv.as_raw_slice()
}
}
impl<A: Codec, const N: usize, const W: usize> PartialEq<SeqArray<A, N, W>> for Seq<A> {
fn eq(&self, other: &SeqArray<A, N, W>) -> bool {
self.as_ref() == other.as_ref()
}
}
impl<A: Codec, const N: usize, const W: usize> PartialEq<&SeqArray<A, N, W>> for Seq<A> {
fn eq(&self, other: &&SeqArray<A, N, W>) -> bool {
self.as_ref() == other.as_ref()
}
}
impl<A: Codec, const N: usize, const W: usize> PartialEq<Seq<A>> for SeqArray<A, N, W> {
fn eq(&self, other: &Seq<A>) -> bool {
self.as_ref() == other.as_ref()
}
}
impl<A: Codec, const N: usize, const W: usize> PartialEq<Seq<A>> for &SeqArray<A, N, W> {
fn eq(&self, other: &Seq<A>) -> bool {
self.as_ref() == other.as_ref()
}
}
impl<A: Codec> PartialEq<SeqSlice<A>> for Seq<A> {
fn eq(&self, other: &SeqSlice<A>) -> bool {
self.as_ref() == other
}
}
impl<A: Codec> PartialEq<&SeqSlice<A>> for Seq<A> {
fn eq(&self, other: &&SeqSlice<A>) -> bool {
self.as_ref() == *other
}
}
impl<A: Codec> PartialEq<Seq<A>> for SeqSlice<A> {
fn eq(&self, other: &Seq<A>) -> bool {
self == other.as_ref()
}
}
impl<A: Codec> PartialEq<Seq<A>> for &SeqSlice<A> {
fn eq(&self, other: &Seq<A>) -> bool {
*self == other.as_ref()
}
}
impl<A: Codec> PartialEq<Seq<A>> for &Seq<A> {
fn eq(&self, other: &Seq<A>) -> bool {
**self == *other
}
}
impl<A: Codec> PartialEq<&Seq<A>> for Seq<A> {
fn eq(&self, other: &&Seq<A>) -> bool {
*self == **other
}
}
impl<A: Codec> Borrow<SeqSlice<A>> for Seq<A> {
fn borrow(&self) -> &SeqSlice<A> {
self
}
}
impl<A: Codec> Deref for Seq<A> {
type Target = SeqSlice<A>;
fn deref(&self) -> &Self::Target {
let bs: *const Bs = ptr::from_ref::<Bs>(&self.bv);
unsafe { &*(bs as *const SeqSlice<A>) }
}
}
impl<A: Codec> AsRef<SeqSlice<A>> for Seq<A> {
fn as_ref(&self) -> &SeqSlice<A> {
self
}
}
impl<A: Codec> Clone for Seq<A> {
fn clone(&self) -> Self {
Self {
_p: PhantomData,
bv: self.bv.clone(),
}
}
}
impl<A: Codec> FromIterator<A> for Seq<A> {
fn from_iter<I: IntoIterator<Item = A>>(iter: I) -> Self {
let i = iter.into_iter();
let mut seq = Seq::with_capacity(i.size_hint().0);
seq.extend(i);
seq
}
}
impl<A: Codec> From<&Vec<A>> for Seq<A> {
fn from(vec: &Vec<A>) -> Self {
vec.iter().copied().collect()
}
}
impl<A: Codec, B: Codec> From<&SeqSlice<A>> for Seq<B>
where
A: Into<B>,
{
fn from(slice: &SeqSlice<A>) -> Self {
slice.iter().map(Into::into).collect()
}
}
impl<A: Codec, B: Codec, const N: usize, const W: usize> From<&SeqArray<A, N, W>> for Seq<B>
where
A: Into<B>,
{
fn from(slice: &SeqArray<A, N, W>) -> Self {
slice.iter().map(Into::into).collect()
}
}
impl<A: Codec, B: Codec, const N: usize, const W: usize> From<SeqArray<A, N, W>> for Seq<B>
where
A: Into<B>,
{
fn from(slice: SeqArray<A, N, W>) -> Self {
slice.iter().map(Into::into).collect()
}
}
impl<A: Codec> TryFrom<&str> for Seq<A> {
type Error = ParseBioError;
fn try_from(s: &str) -> Result<Self, Self::Error> {
Seq::<A>::try_from(s.as_bytes())
}
}
impl<A: Codec> TryFrom<String> for Seq<A> {
type Error = ParseBioError;
fn try_from(s: String) -> Result<Self, Self::Error> {
Seq::<A>::try_from(s.as_str())
}
}
impl<A: Codec> TryFrom<&String> for Seq<A> {
type Error = ParseBioError;
fn try_from(s: &String) -> Result<Self, Self::Error> {
Seq::<A>::try_from(s.as_str())
}
}
impl<A: Codec> FromStr for Seq<A> {
type Err = ParseBioError;
fn from_str(s: &str) -> Result<Self, Self::Err> {
Seq::<A>::try_from(s)
}
}
impl<A: Codec> TryFrom<&[u8]> for Seq<A> {
type Error = ParseBioError;
fn try_from(v: &[u8]) -> Result<Self, Self::Error> {
Self::try_from(v.to_vec())
}
}
impl<A: Codec> TryFrom<Vec<u8>> for Seq<A> {
type Error = ParseBioError;
fn try_from(v: Vec<u8>) -> Result<Self, Self::Error> {
v.into_iter()
.map(|byte| A::try_from_ascii(byte).ok_or(ParseBioError::UnrecognisedBase(byte)))
.collect()
}
}
impl<A: Codec> From<Seq<A>> for String {
fn from(seq: Seq<A>) -> Self {
String::from(seq.as_ref())
}
}
impl<A: Codec> From<&Seq<A>> for String {
fn from(seq: &Seq<A>) -> Self {
String::from(seq.as_ref())
}
}
impl<A: Codec> fmt::Display for Seq<A> {
fn fmt(&self, f: &mut fmt::Formatter<'_>) -> fmt::Result {
fmt::Display::fmt(self.as_ref(), f)
}
}
impl<A: Codec> Extend<A> for Seq<A> {
fn extend<T: IntoIterator<Item = A>>(&mut self, iter: T) {
self.extend(iter);
}
}
impl From<Vec<usize>> for Seq<text::Dna> {
fn from(vec: Vec<usize>) -> Self {
Seq {
_p: PhantomData,
bv: Bv::from_vec(vec),
}
}
}
impl<A: Codec> From<&Bs> for Seq<A> {
fn from(bs: &Bs) -> Self {
Seq {
_p: PhantomData,
bv: bs.into(),
}
}
}
impl<A: Codec> From<Bv> for Seq<A> {
fn from(bv: Bv) -> Self {
Seq {
_p: PhantomData,
bv,
}
}
}
#[cfg(test)]
mod tests {
use crate::prelude::*;
use crate::{Bv, Order};
use bitvec::prelude::*;
use core::borrow::Borrow;
use core::hash::{Hash, Hasher};
use core::marker::PhantomData;
use std::collections::hash_map::DefaultHasher;
#[test]
fn test_revcomp() {
let s1: Seq<Dna> = dna!("ATGTGTGCGACTGA").into();
let s2: Seq<Dna> = dna!("TCAGTCGCACACAT").into();
let s3: &SeqSlice<Dna> = &s1;
assert_eq!(s3.revcomp(), s2.revcomp().revcomp());
assert_eq!(s3.revcomp(), s2);
assert_ne!(s3.revcomp(), s2.revcomp());
assert_eq!(s3, s2.revcomp());
}
#[test]
fn test_revcomp_mismatched_sizes() {
let s1 = dna!("AAAA");
let s2 = dna!("TTTTT");
assert_ne!(s1, s2.revcomp());
}
#[test]
fn test_revcomp_idempotence() {
let s = dna!("AAACGCTACGTACGCGCCTTCGGGGCATCAGCACCAC");
let sc = dna!("AAACGCTACGTACGCGCCTTCGGGGCATCAGCACCAC");
assert_eq!(s.revcomp().revcomp(), sc);
}
#[test]
fn slice_index_comparisions() {
let s1 = dna!("ATGTGTGCGACTGATGATCAAACGTAGCTACG");
let s2 = dna!("ACGTGTGTGCTAGCTAATCGATCAAAAAG");
assert_eq!(&s1[0], &s2[0]);
assert_ne!(&s1[1], &s2[1]);
assert_eq!(&s1[2..4], &s2[2..4]);
assert_eq!(&s1[15..21], &s2[19..25]);
assert_ne!(&s1[2..20], &s2[2..20]);
}
#[test]
fn slice_indexing() {
let seq = dna!("TGCATCGAT");
assert_ne!(&seq[..], &dna!("AGCATCGAA")[..]);
assert_ne!(&seq[3..=6], &dna!("ATC")[..]);
assert_ne!(&seq[..=6], &dna!("TGCATC")[..]);
assert_ne!(&seq[4..5], &dna!("TC")[..]);
assert_ne!(&seq[..6], &dna!("TGCAT")[..]);
assert_ne!(&seq[5..], &dna!("TCGAT")[..]);
assert_eq!(&seq[..], &dna!("TGCATCGAT")[..]);
assert_eq!(&seq[3..=6], &dna!("ATCG")[..]);
assert_eq!(&seq[..=6], &dna!("TGCATCG")[..]);
assert_eq!(&seq[4..5], &dna!("T")[..]);
assert_eq!(&seq[..6], &dna!("TGCATC")[..]);
assert_eq!(&seq[5..], &dna!("CGAT")[..]);
}
#[test]
fn slice_index_ranges() {
let s1: &'static SeqSlice<Dna> = dna!("ACGACTGATCGA");
let s2: &'static SeqSlice<Dna> = dna!("TCGAACGACTGA");
assert_eq!(&s1[..8], &s2[4..]);
assert_eq!(&s1[8..], &s2[..4]);
assert_ne!(&s1[8..], &s2[8..]);
assert_ne!(&s1[..], &s2[..4]);
assert_eq!(&s1[..=7], &s2[4..]);
assert_eq!(&s1[8..], &s2[..=3]);
assert_ne!(&s1[8..11], &s2[8..=11]);
assert_ne!(&s1[..], &s2[..=4]);
}
#[test]
fn slice_nth() {
let s = dna!("ATGTGTGCGACTGATGATCAAACGTAGCTACG");
assert_eq!(s.nth(0), Dna::A);
assert_ne!(s.nth(0), Dna::G);
assert_eq!(s.nth(1), Dna::T);
assert_ne!(s.nth(1), Dna::C);
assert_eq!(s.nth(s.len() - 1), Dna::G);
assert_ne!(s.nth(s.len() - 1), Dna::C);
}
#[test]
fn slice_rangeto_and_full() {
let s1 = dna!("ATCGACTAGCATGCTACG");
let s2 = dna!("ATCGACTAG");
assert_eq!(&s1[..s2.len()], &s2[..]);
assert_ne!(&s2[..s2.len()], &s1[..]);
}
#[test]
fn from_slice() {
let s1 = dna!("ATGTGTGCGACTGATGATCAAACGTAGCTACG");
let s: &SeqSlice<Dna> = &s1[15..21];
assert_eq!(format!("{}", s), "GATCAA");
}
#[test]
fn string_to_seq() {
let seq_str = "ACTGACTG";
let seq: Result<Seq<Dna>, _> = seq_str.try_into();
assert!(seq.is_ok());
assert_eq!(seq.unwrap().to_string(), seq_str);
}
#[test]
fn invalid_string_to_seq() {
let invalid_seq_str = "ACUGACTG";
let seq: Result<Seq<Dna>, _> = invalid_seq_str.try_into();
assert!(seq.is_err());
}
#[test]
fn seq_to_string() {
let seq_str = "ACTGACTG";
let seq: Seq<Dna> = seq_str.try_into().unwrap();
let result_str: String = seq.into();
assert_eq!(result_str, seq_str);
}
#[test]
fn seqslice_to_string() {
let seq_str = "ACTGACTG";
let seq: Seq<Dna> = seq_str.try_into().unwrap();
let slice = &seq[1..5];
let result_str: String = slice.into();
assert_eq!(result_str, "CTGA");
}
#[test]
#[should_panic(expected = "range 2..18 out of bounds: 16")]
fn invalid_seqslice_to_string() {
let seq_str = "ACTGACTG";
let seq: Seq<Dna> = seq_str.try_into().unwrap();
let _ = &seq[1..9];
}
#[test]
fn test_push() {
let mut seq = Seq::<Dna>::new();
seq.push(Dna::A);
seq.push(Dna::C);
seq.push(Dna::G);
seq.push(Dna::T);
assert_eq!(seq.len(), 4);
assert_eq!(String::from(seq), "ACGT")
}
#[test]
fn test_extend_amino() {
let mut seq = Seq::<Amino>::new();
seq.push(Amino::S);
seq.push(Amino::L);
seq.extend(vec![Amino::Y, Amino::M].into_iter());
assert_eq!(seq.len(), 4);
assert_eq!(String::from(seq), "SLYM");
}
#[test]
fn test_extend() {
let mut seq = Seq::<Dna>::new();
seq.push(Dna::A);
seq.push(Dna::C);
seq.extend(vec![Dna::G, Dna::T].into_iter());
assert_eq!(seq.len(), 4);
assert_eq!(String::from(seq), "ACGT");
}
#[test]
fn test_eqs() {
let seq: Seq<Dna> = "ACTAGCATCGA".try_into().unwrap();
let seq2: Seq<Dna> = "ACTAGCATCGA".try_into().unwrap();
let slice: &SeqSlice<Dna> = &seq;
let slice2: &SeqSlice<Dna> = &seq2[..];
assert_eq!(seq, slice);
assert_eq!(seq2, slice);
assert_eq!(seq2, slice2);
assert_eq!(slice, slice2);
assert_eq!(seq, seq2);
}
#[test]
fn test_str_eqs() {
let string: String = "ACTAGCATCGA".into();
let slice: &str = "GCTGCATCGATC";
let seq1: Seq<Dna> = Seq::<Dna>::try_from(slice).unwrap();
let seq2: Seq<Dna> = Seq::<Dna>::try_from(string.clone()).unwrap();
assert_eq!(seq2.to_string(), string);
assert_eq!(seq1.to_string(), slice);
assert_ne!(seq2.to_string(), slice);
assert_ne!(seq1.to_string(), string);
}
#[test]
fn test_from_iter() {
let iter = vec![Dna::A, Dna::C, Dna::G, Dna::T].into_iter();
let seq: Seq<Dna> = Seq::from_iter(iter);
assert_eq!(seq.len(), 4);
assert_eq!(String::from(seq), "ACGT");
}
#[test]
fn test_bit_order() {
let raw: usize = 0b10_11_01_11_10_01_00_01;
let mut bv: Bv = Default::default();
bv.extend(&raw.view_bits::<Order>()[..(Dna::BITS as usize * 8)]);
let s = Seq::<Dna> {
bv,
_p: PhantomData,
};
assert_eq!(dna!("CACGTCTG").to_string(), "CACGTCTG");
assert_eq!(String::from(s), "CACGTCTG");
}
#[test]
fn test_borrow() {
let seq: Seq<Dna> = dna!("ACGACCCCCATAGATGGGCTG").into();
let slice: &SeqSlice<Dna> = seq.borrow();
assert_eq!(slice, &seq[..]);
assert_ne!(slice, &seq[1..]);
}
#[test]
fn test_deref() {
let seq: Seq<Dna> = dna!("AGAATGATCG").into();
let slice: &SeqSlice<Dna> = &*seq;
assert_eq!(slice, &seq[..]);
assert_ne!(slice, &seq[1..]);
}
#[test]
fn test_asref() {
let seq: Seq<Dna> = dna!("AGAATGATCAAAATATATATAAAG").into();
let slice: &SeqSlice<Dna> = seq.as_ref();
assert_ne!(slice, &seq[2..5]);
assert_eq!(slice, &seq[..]);
}
#[test]
fn test_to_owned() {
let seq: Seq<Dna> = dna!("AGAATGAATCG").into();
let slice: &SeqSlice<Dna> = &seq;
let owned: Seq<Dna> = slice[2..5].to_owned();
assert_eq!(&owned, &seq[2..5]);
assert_eq!(owned, seq[2..5].to_owned());
assert_ne!(&owned, &seq[..]);
}
#[test]
fn test_clone() {
let seq: Seq<Dna> = dna!("AGAATGATGGGGGGGGGGGCG").into();
let cloned = seq.clone();
assert_eq!(seq, cloned);
}
#[test]
fn test_trim() {
let seq = b"AGAATGATGGGGGGGGGGGCG";
let s: Seq<Dna> = Seq::trim_u8(seq).unwrap();
assert_eq!(s, dna!("AGAATGATGGGGGGGGGGGCG"));
let seq = b"NNNNAGAATGATGGGGGGGGGGGCGNNNNNNNNNNN";
let s: Seq<Dna> = Seq::trim_u8(seq).unwrap();
assert_eq!(s, dna!("AGAATGATGGGGGGGGGGGCG"));
let seq = b"NNNNAGAATGATGGGGNGGGGGGGCGNNNNNNNNNNN";
let s: Result<Seq<Dna>, ParseBioError> = Seq::trim_u8(seq);
assert_eq!(s, Err(ParseBioError::UnrecognisedBase(b'N')));
let seq = b"AGAATGATGGGGGGGGGGGCG";
let s: Seq<Dna> = Seq::trim_u8(seq).unwrap();
assert_eq!(s, dna!("AGAATGATGGGGGGGGGGGCG"));
let seq = b"NNNNAGAATGATGGGGGGGGGGGCGNNNNNNNNNNN";
let s: Seq<Dna> = Seq::trim_u8(seq).unwrap();
assert_eq!(s, dna!("AGAATGATGGGGGGGGGGGCG"));
let seq = b"NNNNAGAATGATGGGGNGGGGGGGCGNNNNNNNNNNN";
let s: Result<Seq<Dna>, ParseBioError> = Seq::trim_u8(seq);
assert_eq!(s, Err(ParseBioError::UnrecognisedBase(b'N')));
let seq = b"";
let s: Result<Seq<Dna>, ParseBioError> = Seq::trim_u8(seq);
assert!(s.is_ok());
assert_eq!(s.unwrap(), dna!(""));
let seq = b"XXXX";
let s: Result<Seq<Dna>, ParseBioError> = Seq::trim_u8(seq);
assert!(s.is_ok());
assert_eq!(s.unwrap(), dna!(""));
let seq = b"XXACGT";
let s: Seq<Dna> = Seq::trim_u8(seq).unwrap();
assert_eq!(s, dna!("ACGT"));
let seq = b"ACGTXX";
let s: Seq<Dna> = Seq::trim_u8(seq).unwrap();
assert_eq!(s, dna!("ACGT"));
let seq = b"ACGTACGTACGTACGTACGTACGT";
let s: Seq<Dna> = Seq::trim_u8(seq).unwrap();
assert_eq!(s, dna!("ACGTACGTACGTACGTACGTACGT"));
let seq = b"XXACGTXXACGTXX";
let s: Result<Seq<Dna>, ParseBioError> = Seq::trim_u8(seq);
assert_eq!(s, Err(ParseBioError::UnrecognisedBase(b'X')));
let seq = b"A";
let s: Seq<Dna> = Seq::trim_u8(seq).unwrap();
assert_eq!(s, dna!("A"));
let seq = b"X";
let s: Result<Seq<Dna>, ParseBioError> = Seq::trim_u8(seq);
assert!(s.is_ok());
assert_eq!(s.unwrap(), dna!(""));
}
#[test]
fn test_seq_eq_and_hash() {
let seq1: Seq<Dna> = "ACGT".try_into().unwrap();
let seq2: Seq<Dna> = "ACGT".try_into().unwrap();
assert_eq!(seq1, seq2);
let mut hasher1 = DefaultHasher::new();
seq1.hash(&mut hasher1);
let hash1 = hasher1.finish();
let mut hasher2 = DefaultHasher::new();
seq2.hash(&mut hasher2);
let hash2 = hasher2.finish();
assert_eq!(hash1, hash2);
}
#[test]
fn test_seq_slice_eq() {
let seq1: Seq<Dna> = "ACGTAAAAAAAAAAAAACGTAAAACCCCGGGGTTTTA".try_into().unwrap();
let seq2: Seq<Dna> = "ACGTAAAAAAAAAAAAACGTAAAACCCCGGGGTTTTAA".try_into().unwrap();
let slice1a: &SeqSlice<Dna> = &seq1[..];
let slice1b: &SeqSlice<Dna> = &seq1[..];
let slice2a: &SeqSlice<Dna> = &seq2[..seq2.len() - 1];
let slice2b: &SeqSlice<Dna> = &seq2[..seq2.len() - 1];
let seq3: Seq<Dna> = slice2b.into();
assert_eq!(slice1a, slice2b);
assert_eq!(&slice2a, &slice2b);
assert_eq!(seq1, slice2a);
assert_eq!(slice1b, seq3);
assert_eq!(slice1a, slice1b);
assert_eq!(seq1, seq3);
assert_ne!(seq1, seq2);
assert_ne!(seq2, seq3);
assert_ne!(seq2, slice2a);
assert_ne!(seq2, slice1b);
assert_eq!(&slice1a, &slice1b);
assert_eq!(seq1, &seq1);
assert_eq!(seq1, &seq3);
assert_eq!(&seq1, seq3);
assert_eq!(&seq1, &seq3);
assert_eq!(slice1a, seq3);
assert_eq!(seq1, slice2a);
assert_eq!(&seq1, slice2a);
assert_eq!(&seq1, slice2a);
}
#[test]
fn test_seq_slice_hash() {
let seq1: Seq<Dna> = "ACGTAAAAAAAAAAAAACGTAAAACCCCGGGGAAAAA".try_into().unwrap();
let seq2: Seq<Dna> = "ACGTAAAAAAAAAAAAACGTAAAACCCCGGGGAAAAA".try_into().unwrap();
let seq3: Seq<Dna> = "ACGTAAAAAAAAAAAAACGTAAAACCCCGGGG".try_into().unwrap();
let slice1 = &seq1[..];
let slice2 = &seq2[..];
let slice3 = &seq3[..];
let slice1_32 = &seq1[..32];
let mut hasher1 = DefaultHasher::new();
seq1.hash(&mut hasher1);
let full1 = hasher1.finish();
let mut hasher1a = DefaultHasher::new();
seq1.hash(&mut hasher1a);
let full1_alt = hasher1a.finish();
let mut hasher2 = DefaultHasher::new();
seq2.hash(&mut hasher2);
let full2 = hasher2.finish();
let mut hasher3 = DefaultHasher::new();
slice1.hash(&mut hasher3);
let full1_slice = hasher3.finish();
let mut hasher4 = DefaultHasher::new();
slice2.hash(&mut hasher4);
let full2_slice = hasher4.finish();
let mut hasher5 = DefaultHasher::new();
slice3.hash(&mut hasher5);
let short1_slice = hasher5.finish();
let mut hasher6 = DefaultHasher::new();
slice1_32.hash(&mut hasher6);
let seq1_short = hasher6.finish();
assert_eq!(full1, full1_alt);
assert_eq!(full1, full2);
assert_ne!(full2_slice, short1_slice);
assert_eq!(full2, full1_slice);
assert_eq!(short1_slice, seq1_short);
assert_ne!(seq1_short, full1_slice);
assert_ne!(full1, short1_slice);
}
#[test]
fn test_fromstr() {
let seq: Result<Seq<Dna>, ParseBioError> =
"ACGATGAGTAGTCGCCATCGTATCTTTGACTGCCGATGCTA".parse();
assert!(seq.is_ok());
let seq: Result<Seq<Dna>, ParseBioError> =
"ACGATGAGTAGBCGCCATCGTATCTTTGACTGCCGATGCTA".parse();
assert_eq!(seq, Err(ParseBioError::UnrecognisedBase(b'B')));
}
#[test]
fn test_lens() {
assert_eq!(iupac!("AWANWATNA---SKAGTCAA").len(), 20)
}
#[test]
fn test_unique_bitarray_ident() {
let s1 = dna!("ATCGACTACGATCGCTACGATCGATCGATCGATCGAATCTCCCGCGCGATCATCGATCATCGCTACGTACGTCGAAAAATATAATGGG");
let s2 = dna!("ATCGACTACGATCGCTACGATCGATCGATCGATCGAATCTCCCGCGCGATCATCGATCATCGCTACGTACGTCGAAAAATATAATGGG");
let s3 = dna!("CTCGACTACGATCGCTACGATCGATCGATCGATCGAATCTCCCGCGCGATCATCGATCATCGCTACGTACGTCGAAAAATATAATGGG");
let s4 = dna!("ATCGACTACGATCGCTACGATCGATCGATCGATCGAATCTCCCGCGCGATCATCGATCATCGCTACGTACGTCGAAAAATATAATGGGA");
let s5 = dna!("ATCGACTACGATCGCTACGATCGATCGATCGATCGAATCTCCCGCGCGATCATCGATCATCGCTACGTACGTCGAAAAATATAATGGC");
assert_eq!(s1, s2);
assert_ne!(s1, s3);
assert_ne!(s1, s4);
assert_ne!(s4, s1);
assert_ne!(s5, s1);
}
#[test]
fn test_static() {
use crate::seq::SeqArray;
static B: SeqArray<Dna, 5, 1> = SeqArray {
_p: PhantomData,
ba: bitarr![const usize, Lsb0; 1,1,0,1,0,0,1,0,1,1],
};
let s: &'static SeqSlice<Dna> = &B;
let x: &'static str = "TGACT";
assert_eq!(s.to_string(), x);
}
#[test]
fn test_to_from_raw() {
let s = "TCAGCTAGCTACGACTGATCGATCGACTGATGCCGCGCGCGGCGCCGCGCGCGCGCGCCGCGCGCCCCGCGCGCGGCGCGCGCCGCGCGCGCGCGCGGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGCGC";
let seq: Seq<Dna> = s.try_into().unwrap();
let raw = seq.into_raw();
let new = Seq::<Dna>::from_raw(s.len(), raw);
assert_eq!(new, seq);
let bad = Seq::<Dna>::from_raw(342, raw);
assert_ne!(bad, seq);
}
}