fractal 0.7.1 - Docs.rs

//! Multiscale modeling framework for the analysis and synthesis of
//! positive-valued, long-range-dependent processes.
//!
//! ## References
//!
//! 1. R. H. Riedi, M. Crouse, V. Ribeiro, and R. Baraniuk, “[A multifractal
//!    wavelet model with application to network traffic][1],” IEEE Transactions
//!    on Information Theory, vol. 45, no. 3, pp. 992–1018, April 1999.
//!
//! [1]: http://dx.doi.org/10.1109/18.761337

// The implementation is based on:
// http://dsp.rice.edu/software/multifractal-wavelet-model

#[cfg(test)]
extern crate assert;

extern crate dwt;
extern crate probability;
extern crate statistics;

use probability::distribution::Beta as Pearson;
use probability::distribution::{Gaussian, Sample};
use probability::source::Source;
use std::{error, fmt};

/// An error.
pub struct Error(pub &'static str);

/// A result.
pub type Result<T> = std::result::Result<T, Error>;

/// A multifractal wavelet model with beta-distributed multipliers.
pub struct Beta {
    gaussian: Gaussian,
    betas: Vec<Pearson>,
}

macro_rules! raise(($message:expr) => (return Err(Error($message))));

macro_rules! blocks(
    ($number:expr) => (if $number == 0 {
        raise!("the number of blocks should be at least two");
    });
);

macro_rules! scales(
    ($number:expr) => (if $number == 0 {
        raise!("the number of scales should be positive");
    });
);

impl Beta {
    /// Fit the model to the data.
    ///
    /// The number of points used for the analysis is `blocks × 2^scales`. The
    /// parameter `blocks` should be at least two, and it corresponds to the
    /// number of points used for the estimation of the mean and standard
    /// deviation of the underlying process. The parameter `scales` should be at
    /// least one, and it corresponds to the number of scales for which the data
    /// are analyzed. The number `scales` also dictates the size of a sample
    /// drawn by `sample`, namely, each sample contains `2^scales` elements.
    pub fn new(data: &[f64], blocks: usize) -> Result<Self> {
        blocks!(blocks);
        let scales = (data.len() as f64 / blocks as f64).log2().floor() as usize;
        scales!(scales);
        Beta::fit(data, blocks, scales)
    }

    /// Fit the model to the data with a specific number of scales.
    ///
    /// The function is identical to `new` except for specifying the number of
    /// scales instead of the number of blocks.
    pub fn with_scales(data: &[f64], scales: usize) -> Result<Self> {
        scales!(scales);
        let blocks = (data.len() as f64 / (1 << scales) as f64).floor() as usize;
        blocks!(blocks);
        Beta::fit(data, blocks, scales)
    }

    /// Draw a sample.
    pub fn sample<S>(&self, source: &mut S) -> Result<Vec<f64>> where S: Source {
        let nscale = self.betas.len();
        let mut data = Vec::with_capacity(1 << nscale);
        unsafe { data.set_len(1 << nscale) };
        let scale = 0.5f64.powf(nscale as f64 / 2.0);
        let z = scale * self.gaussian.sample(source);
        if z < 0.0 {
            raise!("the model is not appropriate for the data");
        }
        data[0] = z;
        for i in 0..nscale {
            for j in (0..(1 << i)).rev() {
                let x = data[j];
                let a = self.betas[i].sample(source);
                data[2 * j + 0] = (1.0 + a) * x;
                data[2 * j + 1] = (1.0 - a) * x;
            }
        }
        Ok(data)
    }

    fn fit(data: &[f64], blocks: usize, scales: usize) -> Result<Self> {
        use dwt::{Operation, Transform};
        use dwt::wavelet::Haar;
        use statistics::{mean, variance};

        let mut data = (&data[0..(blocks * (1 << scales))]).to_vec();
        data.transform(Operation::Forward, &Haar::new(), scales);
        let gaussian = Gaussian::new(mean(&data[0..blocks]), variance(&data[0..blocks]).sqrt());
        let mut beta = 0.0;
        let mut ms = mean_square(&data[0..blocks]);
        let mut betas = Vec::with_capacity(scales);
        for i in 0..scales {
            let new_ms = mean_square(&data[(blocks * (1 << i))..(blocks * (1 << (i + 1)))]);
            beta = 0.5 * (ms / new_ms) * (beta + 1.0) - 0.5;
            if beta <= 0.0 {
                raise!("the model is not appropriate for the data");
            }
            betas.push(Pearson::new(beta, beta, -1.0, 1.0));
            ms = new_ms;
        }
        Ok(Beta { gaussian: gaussian, betas: betas })
    }
}

impl error::Error for Error {
    #[inline]
    fn description(&self) -> &str {
        &self.0
    }
}

impl fmt::Debug for Error {
    #[inline]
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        self.0.fmt(formatter)
    }
}

impl fmt::Display for Error {
    #[inline]
    fn fmt(&self, formatter: &mut fmt::Formatter) -> fmt::Result {
        self.0.fmt(formatter)
    }
}

#[inline]
fn mean_square(data: &[f64]) -> f64 {
    &data.iter().fold(0.0, |sum, &x| sum + x * x) / data.len() as f64
}

#[cfg(test)]
mod tests {
    use assert;
    use probability::source;

    use Beta;

    #[test]
    fn new() {
        let data = [
            4.018080337519417e-01, 7.596669169084191e-02, 2.399161535536580e-01,
            1.233189348351655e-01, 1.839077882824167e-01, 2.399525256649028e-01,
            4.172670690843695e-01, 4.965443032574213e-02, 9.027161099152811e-01,
            9.447871897216460e-01, 4.908640924680799e-01, 4.892526384000189e-01,
            3.377194098213772e-01, 9.000538464176620e-01, 3.692467811202150e-01,
            1.112027552937874e-01, 7.802520683211379e-01, 3.897388369612534e-01,
            2.416912859138327e-01, 4.039121455881147e-01, 9.645452516838859e-02,
            1.319732926063351e-01, 9.420505907754851e-01, 9.561345402298023e-01,
            5.752085950784656e-01, 5.977954294715582e-02, 2.347799133724063e-01,
            3.531585712220711e-01, 8.211940401979591e-01, 1.540343765155505e-02,
            4.302380165780784e-02, 1.689900294627044e-01, 6.491154749564521e-01,
            7.317223856586703e-01, 6.477459631363067e-01, 4.509237064309449e-01,
            5.470088922863450e-01, 2.963208056077732e-01, 7.446928070741562e-01,
            1.889550150325445e-01, 6.867754333653150e-01, 1.835111557372697e-01,
        ];

        let model = Beta::new(&data, 5).unwrap();

        assert::close(&model.betas.iter().map(|beta| beta.beta()).collect::<Vec<_>>(), &[
            1.635153583946054e+01, 2.793188701574629e+00, 3.739374677617142e+00,
        ], 1e-14);
        assert::close(model.gaussian.mu(), 1.184252871226982e+00, 1e-14);
        assert::close(model.gaussian.sigma(), 4.466592147518644e-01, 1e-14);
    }

    #[test]
    fn sample() {
        let data = [
            4.983640519821430e-01, 9.597439585160811e-01, 3.403857266661332e-01,
            5.852677509797773e-01, 2.238119394911370e-01, 7.512670593056529e-01,
            2.550951154592691e-01, 5.059570516651424e-01, 6.990767226566860e-01,
            8.909032525357985e-01, 9.592914252054443e-01, 5.472155299638031e-01,
            1.386244428286791e-01, 1.492940055590575e-01, 2.575082541237365e-01,
            8.407172559836625e-01, 2.542821789715310e-01, 8.142848260688164e-01,
            2.435249687249893e-01, 9.292636231872278e-01, 3.499837659848087e-01,
            1.965952504312082e-01, 2.510838579760311e-01, 6.160446761466392e-01,
            4.732888489027293e-01, 3.516595070629968e-01, 8.308286278962909e-01,
            5.852640911527243e-01, 5.497236082911395e-01, 9.171936638298100e-01,
            2.858390188203735e-01, 7.572002291107213e-01, 7.537290942784953e-01,
            3.804458469753567e-01, 5.678216407252211e-01, 7.585428956306361e-02,
            5.395011866660715e-02, 5.307975530089727e-01, 7.791672301020112e-01,
            9.340106842291830e-01, 1.299062084737301e-01, 5.688236608721927e-01,
        ];

        let model = Beta::with_scales(&data, 3).unwrap();
        let data = model.sample(&mut source::default()).unwrap();

        assert_eq!(data.len(), 8);
    }
}