pub struct FMDIndex<DBWT: Borrow<BWT>, DLess: Borrow<Less>, DOcc: Borrow<Occ>> { /* private fields */ }
Expand description

The FMD-Index for linear-time search of supermaximal exact matches on the forward and reverse strands of DNA texts (Li, 2012).

Implementations§

source§

impl<DBWT: Borrow<BWT>, DLess: Borrow<Less>, DOcc: Borrow<Occ>> FMDIndex<DBWT, DLess, DOcc>

source

pub fn smems( &self, pattern: &[u8], i: usize, l: usize ) -> Vec<(BiInterval, usize, usize)>

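Find supermaximal exact matches (of length >= l) of the given pattern that overlap position i in the pattern. Each returned tuple holds the bi-interval of the match, the start position of the match in the pattern, and the length of the match. Complexity O(m) with pattern of length m.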

Example
use bio::alphabets::dna;
use bio::data_structures::bwt::{bwt, less, Occ};
use bio::data_structures::fmindex::{FMDIndex, FMIndex};
use bio::data_structures::suffix_array::suffix_array;

let text = b"ATTC$GAAT$";
let alphabet = dna::n_alphabet();
let sa = suffix_array(text);
let bwt = bwt(text, &sa);
let less = less(&bwt, &alphabet);
let occ = Occ::new(&bwt, 3, &alphabet);
let fm = FMIndex::new(&bwt, &less, &occ);
let fmdindex = FMDIndex::from(fm);

let pattern = b"ATT";
let intervals = fmdindex.smems(pattern, 2, 0);

let forward_positions = intervals[0].0.forward().occ(&sa);
let revcomp_positions = intervals[0].0.revcomp().occ(&sa);
let pattern_position = intervals[0].1;
let smem_len = intervals[0].2;

assert_eq!(forward_positions, [0]);
assert_eq!(revcomp_positions, [6]);
assert_eq!(pattern_position, 0);
assert_eq!(smem_len, 3);
source

pub fn all_smems( &self, pattern: &[u8], l: usize ) -> Vec<(BiInterval, usize, usize)>

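Find all supermaximal exact matches (of length >= l) of the given pattern. Each returned tuple holds the bi-interval of the match, the start position of the match in the pattern, and the length of the match. Complexity O(m^2) with pattern of length m.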

Example
use bio::alphabets::dna;
use bio::data_structures::bwt::{bwt, less, Occ};
use bio::data_structures::fmindex::{FMDIndex, FMIndex};
use bio::data_structures::suffix_array::suffix_array;

let text = b"ATTCGGGG$CCCCGAAT$";
let alphabet = dna::n_alphabet();
let sa = suffix_array(text);
let bwt = bwt(text, &sa);
let less = less(&bwt, &alphabet);
let occ = Occ::new(&bwt, 3, &alphabet);
let fm = FMIndex::new(&bwt, &less, &occ);
let fmdindex = FMDIndex::from(fm);

let pattern = b"ATTGGGG";
let intervals = fmdindex.all_smems(pattern, 0);
assert_eq!(intervals.len(), 2);

let solutions = vec![[0, 14, 0, 3], [4, 9, 3, 4]];
for (i, interval) in intervals.iter().enumerate() {
    let forward_positions = interval.0.forward().occ(&sa);
    let revcomp_positions = interval.0.revcomp().occ(&sa);
    let pattern_position = interval.1;
    let smem_len = interval.2;
    assert_eq!(
        [
            forward_positions[0],
            revcomp_positions[0],
            pattern_position,
            smem_len
        ],
        solutions[i]
    );
}
source

pub fn init_interval_with(&self, a: u8) -> BiInterval

Initialize interval with given start character.

source

pub fn init_interval(&self) -> BiInterval

Initialize interval for empty pattern. The interval points at the whole suffix array.

source

pub fn backward_ext(&self, interval: &BiInterval, a: u8) -> BiInterval

Backward extension of given interval with given character.

source

pub fn forward_ext(&self, interval: &BiInterval, a: u8) -> BiInterval

Forward extension of given interval with given character.

source

pub unsafe fn from_fmindex_unchecked( fmindex: FMIndex<DBWT, DLess, DOcc> ) -> FMDIndex<DBWT, DLess, DOcc>

Construct a new instance of the FMD index (see Heng Li (2012) Bioinformatics) without checking whether the text is over the DNA alphabet with N. This expects a BWT that was created from a text over the DNA alphabet with N (alphabets::dna::n_alphabet()), where the text is the original sequence concatenated with its reverse complement, each terminated by the sentinel symbol $. I.e., let T be the original text and R be its reverse complement. Then, the expected text is T$R$. Further, multiple concatenated texts are allowed, e.g. T1$R1$T2$R2$T3$R3$. Safety: it is unsafe to construct an FMD index from an FM index that is not built on the DNA alphabet.

Trait Implementations§

source§

impl<DBWT: Clone + Borrow<BWT>, DLess: Clone + Borrow<Less>, DOcc: Clone + Borrow<Occ>> Clone for FMDIndex<DBWT, DLess, DOcc>

source§

fn clone(&self) -> FMDIndex<DBWT, DLess, DOcc>

Returns a copy of the value. Read more
1.0.0 · source§

fn clone_from(&mut self, source: &Self)

Performs copy-assignment from source. Read more
source§

impl<DBWT: Debug + Borrow<BWT>, DLess: Debug + Borrow<Less>, DOcc: Debug + Borrow<Occ>> Debug for FMDIndex<DBWT, DLess, DOcc>

source§

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more
source§

impl<DBWT: Default + Borrow<BWT>, DLess: Default + Borrow<Less>, DOcc: Default + Borrow<Occ>> Default for FMDIndex<DBWT, DLess, DOcc>

source§

fn default() -> FMDIndex<DBWT, DLess, DOcc>

Returns the “default value” for a type. Read more
source§

impl<'de, DBWT, DLess, DOcc> Deserialize<'de> for FMDIndex<DBWT, DLess, DOcc> where DBWT: Deserialize<'de> + Borrow<BWT>, DLess: Deserialize<'de> + Borrow<Less>, DOcc: Deserialize<'de> + Borrow<Occ>,

source§

fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where __D: Deserializer<'de>,

Deserialize this value from the given Serde deserializer. Read more
source§

impl<DBWT: Borrow<BWT>, DLess: Borrow<Less>, DOcc: Borrow<Occ>> FMIndexable for FMDIndex<DBWT, DLess, DOcc>

source§

fn bwt(&self) -> &BWT

Provide a reference to the underlying BWT.

source§

fn occ(&self, r: usize, a: u8) -> usize

Get occurrence count of symbol a in BWT[..r+1].
source§

fn less(&self, a: u8) -> usize

Also known as the C array: the number of symbols in the BWT that are lexicographically smaller than a.
The provided backward_search method performs backward search, yielding a BackwardSearchResult enum that contains the suffix array interval denoting exact occurrences of the given pattern of length m in the text if it exists, or the suffix array interval denoting the exact occurrences of a maximal matching suffix of the given pattern if it does not exist. If no part of the pattern can be matched, the BackwardSearchResult is Absent. Complexity: O(m). Read more
source§

impl<DBWT: Borrow<BWT>, DLess: Borrow<Less>, DOcc: Borrow<Occ>> From<FMIndex<DBWT, DLess, DOcc>> for FMDIndex<DBWT, DLess, DOcc>

source§

fn from(fmindex: FMIndex<DBWT, DLess, DOcc>) -> FMDIndex<DBWT, DLess, DOcc>

Construct a new instance of the FMD index (see Heng Li (2012) Bioinformatics). This expects a BWT that was created from a text over the DNA alphabet with N (alphabets::dna::n_alphabet()), where the text is the original sequence concatenated with its reverse complement, each terminated by the sentinel symbol $. I.e., let T be the original text and R be its reverse complement. Then, the expected text is T$R$. Further, multiple concatenated texts are allowed, e.g. T1$R1$T2$R2$T3$R3$.

source§

impl<DBWT: Hash + Borrow<BWT>, DLess: Hash + Borrow<Less>, DOcc: Hash + Borrow<Occ>> Hash for FMDIndex<DBWT, DLess, DOcc>

source§

fn hash<__H: Hasher>(&self, state: &mut __H)

Feeds this value into the given Hasher. Read more
1.3.0 · source§

fn hash_slice<H>(data: &[Self], state: &mut H) where H: Hasher, Self: Sized,

Feeds a slice of this type into the given Hasher. Read more
source§

impl<DBWT: Ord + Borrow<BWT>, DLess: Ord + Borrow<Less>, DOcc: Ord + Borrow<Occ>> Ord for FMDIndex<DBWT, DLess, DOcc>

source§

fn cmp(&self, other: &FMDIndex<DBWT, DLess, DOcc>) -> Ordering

This method returns an Ordering between self and other. Read more
1.21.0 · source§

fn max(self, other: Self) -> Self where Self: Sized,

Compares and returns the maximum of two values. Read more
1.21.0 · source§

fn min(self, other: Self) -> Self where Self: Sized,

Compares and returns the minimum of two values. Read more
1.50.0 · source§

fn clamp(self, min: Self, max: Self) -> Self where Self: Sized + PartialOrd<Self>,

Restrict a value to a certain interval. Read more
source§

impl<DBWT: PartialEq + Borrow<BWT>, DLess: PartialEq + Borrow<Less>, DOcc: PartialEq + Borrow<Occ>> PartialEq<FMDIndex<DBWT, DLess, DOcc>> for FMDIndex<DBWT, DLess, DOcc>

source§

fn eq(&self, other: &FMDIndex<DBWT, DLess, DOcc>) -> bool

This method tests for self and other values to be equal, and is used by ==.
1.0.0 · source§

fn ne(&self, other: &Rhs) -> bool

This method tests for !=. The default implementation is almost always sufficient, and should not be overridden without very good reason.
source§

impl<DBWT: PartialOrd + Borrow<BWT>, DLess: PartialOrd + Borrow<Less>, DOcc: PartialOrd + Borrow<Occ>> PartialOrd<FMDIndex<DBWT, DLess, DOcc>> for FMDIndex<DBWT, DLess, DOcc>

source§

fn partial_cmp(&self, other: &FMDIndex<DBWT, DLess, DOcc>) -> Option<Ordering>

This method returns an ordering between self and other values if one exists. Read more
1.0.0 · source§

fn lt(&self, other: &Rhs) -> bool

This method tests less than (for self and other) and is used by the < operator. Read more
1.0.0 · source§

fn le(&self, other: &Rhs) -> bool

This method tests less than or equal to (for self and other) and is used by the <= operator. Read more
1.0.0 · source§

fn gt(&self, other: &Rhs) -> bool

This method tests greater than (for self and other) and is used by the > operator. Read more
1.0.0 · source§

fn ge(&self, other: &Rhs) -> bool

This method tests greater than or equal to (for self and other) and is used by the >= operator. Read more
source§

impl<DBWT, DLess, DOcc> Serialize for FMDIndex<DBWT, DLess, DOcc> where DBWT: Serialize + Borrow<BWT>, DLess: Serialize + Borrow<Less>, DOcc: Serialize + Borrow<Occ>,

source§

fn serialize<__S>(&self, __serializer: __S) -> Result<__S::Ok, __S::Error> where __S: Serializer,

Serialize this value into the given Serde serializer. Read more
source§

impl<DBWT: Copy + Borrow<BWT>, DLess: Copy + Borrow<Less>, DOcc: Copy + Borrow<Occ>> Copy for FMDIndex<DBWT, DLess, DOcc>

source§

impl<DBWT: Eq + Borrow<BWT>, DLess: Eq + Borrow<Less>, DOcc: Eq + Borrow<Occ>> Eq for FMDIndex<DBWT, DLess, DOcc>

source§

impl<DBWT: Borrow<BWT>, DLess: Borrow<Less>, DOcc: Borrow<Occ>> StructuralEq for FMDIndex<DBWT, DLess, DOcc>

source§

impl<DBWT: Borrow<BWT>, DLess: Borrow<Less>, DOcc: Borrow<Occ>> StructuralPartialEq for FMDIndex<DBWT, DLess, DOcc>

Auto Trait Implementations§

§

impl<DBWT, DLess, DOcc> RefUnwindSafe for FMDIndex<DBWT, DLess, DOcc> where DBWT: RefUnwindSafe, DLess: RefUnwindSafe, DOcc: RefUnwindSafe,

§

impl<DBWT, DLess, DOcc> Send for FMDIndex<DBWT, DLess, DOcc> where DBWT: Send, DLess: Send, DOcc: Send,

§

impl<DBWT, DLess, DOcc> Sync for FMDIndex<DBWT, DLess, DOcc> where DBWT: Sync, DLess: Sync, DOcc: Sync,

§

impl<DBWT, DLess, DOcc> Unpin for FMDIndex<DBWT, DLess, DOcc> where DBWT: Unpin, DLess: Unpin, DOcc: Unpin,

§

impl<DBWT, DLess, DOcc> UnwindSafe for FMDIndex<DBWT, DLess, DOcc> where DBWT: UnwindSafe, DLess: UnwindSafe, DOcc: UnwindSafe,

Blanket Implementations§

source§

impl<T> Any for T where T: 'static + ?Sized,

source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
source§

impl<T> Borrow<T> for T where T: ?Sized,

source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
source§

impl<T> BorrowMut<T> for T where T: ?Sized,

source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
source§

impl<Q, K> Equivalent<K> for Q where Q: Eq + ?Sized, K: Borrow<Q> + ?Sized,

source§

fn equivalent(&self, key: &K) -> bool

Compare self to key and return true if they are equal.
source§

impl<T> From<T> for T

source§

fn from(t: T) -> T

Returns the argument unchanged.

source§

impl<T, U> Into<U> for T where U: From<T>,

source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

source§

impl<T> Same<T> for T

§

type Output = T

Should always be Self
§

impl<SS, SP> SupersetOf<SS> for SP where SS: SubsetOf<SP>,

§

fn to_subset(&self) -> Option<SS>

The inverse inclusion map: attempts to construct self from the equivalent element of its superset. Read more
§

fn is_in_subset(&self) -> bool

Checks if self is actually part of its subset T (and can be converted to it).
§

fn to_subset_unchecked(&self) -> SS

Use with care! Same as self.to_subset but without any property checks. Always succeeds.
§

fn from_subset(element: &SS) -> SP

The inclusion map: converts self to the equivalent element of its superset.
source§

impl<T> ToOwned for T where T: Clone,

§

type Owned = T

The resulting type after obtaining ownership.
source§

fn to_owned(&self) -> T

Creates owned data from borrowed data, usually by cloning. Read more
source§

fn clone_into(&self, target: &mut T)

Uses borrowed data to replace owned data, usually by cloning. Read more
source§

impl<T, U> TryFrom<U> for T where U: Into<T>,

§

type Error = Infallible

The type returned in the event of a conversion error.
source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
source§

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
§

impl<V, T> VZip<V> for T where V: MultiLane<T>,

§

fn vzip(self) -> V

source§

impl<T> DeserializeOwned for T where T: for<'de> Deserialize<'de>,

source§

impl<N> NodeTrait for N where N: Copy + Ord + Hash,

source§

impl<T> Scalar for T where T: 'static + Clone + PartialEq<T> + Debug,